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HUMAN TELOMERASE j 

1 • 

ATGCCGCGCGCTCCCCGCTGCCGAGCCGTGCGCTCCCTGCTGCGCAGCCACTACCGCGAG 60 

MetProArgAlaProArgCysArgAlaValArgSerLeuLeuArgSerHisTyrArgGlu 20 

GTGCTGCCGCTGGCCACGTTCGTGCGGCGCCTGGGGCCCCAGGGCTGGCGGCTGGTGCAG 120 

ValLeuProLeuAlaThrPheValArgArgLeuGlyProGlnGlyTrpArgLeuValGln 40 

CGCGGGGACCCGGCGGCTTTCCGCGCGCTGGTGGCCCAGTGCCTGGTGTGCGTGCCCTGG 180 

ArgGlyAspProAlaAlaPheArgAlaLeuValAlaGlnCysLeuValCysValProTrp 60 

GACGCACGGCCGCCCCCCGCCGCCCCCTCCTTCCGCCAGGTGTCCTGCCTGAAGGAGCTG 240

AspAlaArgProProProAlaAlaProSerPheArgGlnValSerCysLeuLysGluLeu 80 

GTGGCCCGAGTGCTGCAGAGGCTGTGCGAGCGCGGCGCGAAGAACGTGCTGGCCTTCGGC 300 

ValAlaArgValLeuGlnArgLeuCysGluArgGlyAlaLysAsnValLeuAlaPheGly 100 

TTCGCGCTGCTGGACGGGGCCCGCGGGGGCCCCCCCGAGGCCTTCACCACCAGCGTGCGC 360 

PheAlaLeuLeuAspGlyAlaArgGlyGlyProProGluAlaPheThrThrSerValArg 120 

AGCTACCTGCCCAACACGGTGACCGACGCACTGCGGGGGAGCGGGGCGTGGGGGCTGCTG 420 

SerTyrLeuProAsnThrValThrAspAlaLeuArgGlySerGlyAlaTrpGlyLeuLeu 140

TTGCGCCGCGTGGGCGACGACGTGCTGGTTCACCTGCTGGCACGCTGCGCGCTCTTTGTG 480 

LeuArgArgValGlyAspAspValLeuValHisLeuLeuAlaArgCysAlaLeuPheVal 160

CTGGTGGCTCCCAGCTGCGCCTACCAGGTGTGCGGGCCGCCGCTGTACCAGCTCGGCGCT 540 

LeuValAlaProSerCysAlaTyrGlnValCysGlyProProLeuTyrGlnLeuGlyAla 180

> ■ • • 

GCCACTCAGGCCCGGCCCCCGCCACACGCTAGTGGACCCCGAAGGCGTCTGGGATGCGAA 600 

AlaThrGlnAlaArgProProProHisAlaSerGlyProArgArgArgLeuGlyCysGlu 200 

CGGGCCTGGAACCATAGCGTCAGGGAGGCCGGGGTCCCCCTGGGCCTGCCAGCCCCGGGT 660 

ArgAlaTrpAsnHisSerValArgGluAlaGlyValProLeuGlyLeuProAlaProGly 220

• • * * " 

GCGAGGAGGCGCGGGGGCAGTGCCAGCCGAAGTCTGCCGTTGCCCAAGAGGCCCAGGCGT 720 

AlaArgArgArgGlyGlySerAlaSerArgSerLeuProLeuProLysArgProArgArg 240 
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• * • • • • 

GGCGCTGCCCCTGAGCCGGAGCGGACGCCCGTTGGGCAGGGGTCCTGGGCCCACCCGGGC 780 

GlyAlaAlaProGluProGluArgThrProValGlyGlnGlySerTrpAlaHisProGly 260

• • • • • • 

AGGACGCGTGGACCGAGTGACCGTGGTTTCTGTGTGGTGTCACCTGCCAGACCCGCCGAA 840 

ArgThrArgGlyProSerAspArgGlyPheCysValValSerProAlaArgProAlaGlu 280 

■ • • • • • 

GAAGCCACCTCTTTGGAGGGTGCGCTCTCTGGCACGCGCCACTCCCACCCATCCGTGGGC 900 

GluAlaThrSerLeuGluGlyAlaLeuSerGlyThrArgHisSerHisProSerValGly 300

• • * * • • 

CGCCAGCACCACGCGGGCCCCCCATCCACATCGCGGCCACCACGTCCCTGGGACACGCCT 960 

ArgGlnHisHisAlaGlyProProSerThrSerArgProProArgProTrpAspThrPro 320 

• • • • • .* 

TGTCCCCCGGTGTACGCCGAGACCAAGCACTTCCTCTACTCCTCAGGCGACAAGGAGCAG 1020

CysProProValTyrAlaGluThrLysHisPheLeuTyrSerSerGlyAspLysGluGln 340

• • • • • • 

CTGCGGCCCTCCTTCCTACTCAGCTCTCTGAGGCCCAGCCTGACTGGCGCTCGGAGGCTC 1080

LeuArgProSerPheLeuLeuSerSerLeuArgProSerLeuThrGlyAlaArgArgLeu 360 

• • • > . . 

GTGGAGACCATCTTTCTGGGTTCCAGGCCCTGGATGCCAGGGACTCCCCGCAGGTTGCCC 1140 

ValGluThrIlePheLeuGlySerArgProTrpMetProGlyThrProArgArgLeuPro 380

v • • * • # • 

CGCCTGCCCCAGCGCTACTGGCAAATGCGGCCCCTGTTTCTGGAGCTGCTTGGGAACCAC 1200 

ArgLeuProGlnArgTyrTrpGlnMetArgProLeuPheLeuGluLeuLeuGlyAsnHis 400 

• • * • • • 

GCGCAGTGCCCCTACGGGGTGCTCCTCAAGACGCACTGCCCGCTGCGAGCTGCGGTCACC 1260 

AlaGlnCysProTyrGlyValLeuLeuLysThrHisCysProLeuArgAlaAlaValThr 420 

• • * • • • 

CCAGCAGCCGGTGTCTGTGCCCGGGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCGAGGAG 1320 

ProAlaAlaGlyValCysAlaArgGluLysProGlnGlySerValAlaAlaProGluGlu 440

GAGGACACAGACCCCCGTCGCCTGGTGCAGCTGCTCCGCCAGCACAGCAGCCCCTGGCAG 1380 

GluAspThrAspProArgArgLeuValGlnLeuLeuArgGlnHisSerSerProTrpGln 460

■ • • • ■ a 

GTGTACGGCTTCGTGCGGGCCTGCCTGCGCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCC 1440 

ValTyrGlyPheValArgAlaCysLeuArgArgLeuValProProGlyLeuTrpGlySer 480 

> • • • a • 

AGGCACAACGAACGCCGCTTCCTCAGGAACACCAAGAAGTTCATCTCCCTGGGGAAGCAT 1500 

ArgHisAsnGluArgArgPheLeuArgAsnThrLysLysPheIleSerLeuGlyLysHis 500
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*.;3 



GCCAAGCTCTCGCTGCAGGAGCTGACGTGGAAGATGAGCGTGCGGGGCTGCGCTTGGCTG 1560 

AlaLysLeuSerLeuGlnGluLeuThrTrpLysMetSerValArgAspCysAlaTrpLeu 520

• ••••• 

CGCAGGAGCCCAGGGGTTGGCTGTGTTCCGGCCGCAGAGCACCGTCTGCGTGAGGAGATC 1620 

ArgArgSerProGlyValGlyCysValProAlaAlaGluHisArgLeuArgGluGluIle 540 

• • • • • « 

CTGGCCAAGTTCCTGCACTGGCTGATGAGTGTGTACGTCGTCGAGCTGCTCAGGTCTTTC 1680 

LeuAlaLysPheLeuHisTrpLeuMetSerValTyrValValGluLeuLeuArgSerPhe 560

• • • . ♦ 

TTTTATGTCACGGAGACCACGTTTCAAAAGAACAGGCTCTTTTTCTACCGGAAGAGTGTC 1740 

PheTyrValThrGluThrThrPheGlnLysAsnArgLeuPhePheTyrArgLysSerVal 580 

TGGAGCAAGTTGCAAAGCATTGGAATCAGACAGCACTTGAAGAGGGTGCAGCTGCGGGAG 1800 

TrpSerLysLeuGlnSerIleGlyIleArgGlnHisLeuLysArgValGlnLeuArgGlu 600

• • . • • . , 

CTGTCGGAAGCAGAGGTCAGGCAGCATCGGGAAGCCAGGCCCGCCCTGCTGACGTCCAGA 1860 

LeuSerGluAlaGluValArgGlnHisArgGluAlaArgProAlaLeuLeuThrSerArg 620 



CTCCGCTTCATCCCCAAGCCTGACGGGCTGCGGCCGATTGTGAACATGGACTACGTCGTG 1920

LeuArgPheIleProLysProAspGlyLeuArgProIleValAsnMetAspTyrValVal 640



GGAGCCAGAACGTTCCGCAGAGAAAAGAGGGCCGAGCGTCTCACCTCGAGGGTGAAGGCA 1980 

GlyAlaArgThrPheArgArgGluLysArgAlaGluArgLeuThrSerArgValLysAla 660

• * • • • • 

CTGTTCAGCGTGCTCAACTACGAGCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTCTGTG 2040

LeuPheSerValLeuAsnTyrGluArgAlaArgArgProGlyLeuLeuGlyAlaSerVal 680

• • • • • • 

CTGGGCCTGGACGATATCCACAGGGCCTGGCGCACCTTCGTGCTGCGTGTGCGGGCCCAG 2100 

LeuGlyLeuAspAspIleHisArgAlaTrpArgThrPheValLeuArgValArgAlaGln 700

• • • ... 

GACCCGCCGCCTGAGCTGTACTTTGTCAAGGTGGATGTGACGGGCGCGTACGACACCATC 2160 

AspProProProGluLeuTyrPheValLysValAspValThrGlyAlaTyrAspThrIle 720

• * ... 

CCCCAGGACAGGCTCACGGAGGTCATCGCCAGCATCATCAAACCCCAGAACACGTACTGC 2220 

ProGlnAspArgLeuThrGluValIleAlaSerIleIleLysProGlnAsnThrTyrCys 740

• • . . 

GTGCGTCGGTATGCCGTGGTCCAGAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAG 2280 

ValArgArgTyrAlaValValGlnLysAlaAlaHisGlyHisValArgLysAlaPheLys 760 
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AGCCACGTCTCTACCTTGACAGACCTCCAGCCGTACATGCGACAGTTCGTGGCTCACCTG 2340 

SerHisValSerThrLeuThrAspLeuGlnProTyrMetArgGlnPheValAlaHisLeu 780

CAGGAGACCAGCCCGCTGAGGGATGCCGTCGTCATCGAGCAGAGCTCCTCCCTGAATGAG 2400 

GlnGluThrSerProLeuArgAspAlaValValIleGluGlnSerSerSerLeuAsnGlu 800

GCCAGCAGTGGCCTCTTCGACGTCTTCCTACGCTTCATGTGCCACCACGCCGTGCGCATC 2460 

AlaSerSerGlyLeuPheAspValPheLeuArgPheMetCysHisHisAlaValArgIle 820

AGGGGCAAGTCCTACGTCCAGTGCCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTG 2520 

ArgGlyLysSerTyrValGlnCysGlnGlyIleProGlnGlySerIleLeuSerThrLeu 840

CTCTGCAGCCTGTGCTACGGCGACATGGAGAACAAGCTGTTTGCGGGGATTCGGCGGGAC 2580 

LeuCysSerLeuCysTyrGlyAspMetGluAsnLysLeuPheAlaGlyIleArgArgAsp 860

GGGCTGCTCCTGCGTTTGGTGGATGATTTCTTGTTGGTGACACCTCACCTCACCCACGCG 2640

GlyLeuLeuLeuArgLeuValAspAspPheLeuLeuValThrProHisLeuThrHisAla 880 

* • • * 

AAAACCTTCCTCAGGACCCTGGTCCGAGGTGTCCCTGAGTATGGCTGCGTGGTGAACTTG 2700 

LysThrPheLeuArgThrLeuValArgGlyValProGluTyrGlyCysValValAsnLeu 900 

CGGAAGACAGTGGTGAACTTCCCTGTAGAAGACGAGGCCCTGGGTGGCACGGCTTTTGTT 2760

ArgLysThrValValAsnPheProValGluAspGluAlaLeuGlyGlyThrAlaPheVal 920 

CAGATGCCGGCCCACGGCCTATTCCCCTGGTGCGGCCTGCTGCTGGATACCCGGACCCTG 2820 

GlnMetProAlaHisGlyLeuPheProTrpCysGlyLeuLeuLeuAspThrArgThrLeu 940

GAGGTGCAGAGCGACTACTCCAGCTATGCCCGGACCTCCATCAGAGCCAGTCTCACCTTC 2880 

GluValGlnSerAspTyrSerSerTyrAlaArgThrSerIleArgAlaSerLeuThrPhe 960

AACCGCGGCTTCAAGGCTGGGAGGAACATGCGTCGCAAACTCTTTGGGGTCTTGCGGCTG 2940

AsnArgGlyPheLysAlaGlyArgAsnMetArgArgLysLeuPheGlyValLeuArgLeu 980

AAGTGTCACAGCCTGTTTCTGGATTTGCAGGTGAACAGCCTCCAGACGGTGTGCACCAAC 3000 

LysCysHisSerLeuPheLeuAspLeuGlnValAsnSerLeuGlnThrValCysThrAsn 1000

ATCTACAAGATCCTCCTGCTGCAGGCGTACAGGTTTCACGCATGTGTGCTGCAGCTCCCA 3060 

IleTyrLysIleLeuLeuLeuGlnAlaTyrArgPheHisAlaCysValLeuGlnLeuPro 1020 
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3120 

PheHisGlnGlnValTrpLysAsnProThrPhePheLeuArgValIleSerAspThrAla 1040



TTTCATCAGCAAGTTTGGAAGAACCCCACATTTTTCCTGCGCGTCATCTCTGACACGGCC



3180 

SerLeuCysTyrSerIleLeuLysAlaLysAsnAlaGlyMetSerLeuGlyAlaLysGly 1060



TCCCTCTGCTACTCCATCCTGAAAGCCAAGAACGCAGGGATGTCGCTGGGGGCCAAGGGC 



GCCGCCGGCCCTCTGCCCTCCGAGGCCGTGCAGTGGCTGTGCCACCAAGCATTCCTGCTC 3240 

AlaAlaGlyProLeuProSerGluAlaValGlnTrpLeuCysHisGlnAlaPheLeuLeu 1080 

AAGCTGACTCGACACCGTGTCACCTACGTGCCACTCCTGGGGTCACTCAGGACAGCCCAG 3300 

LysLeuThrArgHisArgValThrTyrValProLeuLeuGlySerLeuArgThrAlaGln 1100

ACGCAGCTGAGTCGGAAGCTCCCGGGGACGACGCTGACTGCCCTGGAGGCCGCAGCCAAC 3360 

ThrGlnLeuSerArgLysLeuProGlyThrThrLeuThrAlaLeuGluAlaAlaAlaAsn 1120



ggggggaggtgctgtgggagtaaaa 
aaaa 



3420 
1132 



CCGGCACTGCCCTCAGACTTCAAGACCATCCTGGACtgatggccacccgcccacagccag 
ProAlaLeuProSerAspPheLysThrIleLeuAsp

Gccgagagcagacaccagcagccctgtcacgccgggctctacgtcccagggagggagggg 3480 

CggLLLcLaggcccgcaccgctgggag^ccgaggcctgagtgagtgtttggccgag 3540 

gcctgcatgtccggctgaaggcrgagtgtccggctgaggcctgagcgagtgtccagccaa 3600 

gg g c?gag?gtccagcacacctgccgtc t tcacttccccacaggc t ggcgctcggctcca 3660 

cJccagggccagctctccctcaccaggagcccggctrccactccccacataggaatagtc 3720 

catcccSgattcgccattgrtcaccccrcgccctgccctcctttgccttccacccccac 3780 

catccagg^ggagLcctgagaaggaccctgggagcrctgggaatttggagtgaccaaag 3840 

atqtgccctgtacacaggcgaggaccctgcaccrggatgggggtcqptgtgggtcaaatt 3900 

9 9 1 ^ a ^ aa «Atactgaatatatgagtttttcagttttgaaaaaaa 3960 



3964 
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sequence "Y" 104-105 bases 

GGCCTCCCCGGGGTCGGCGTCCGGCTGGGGTTGAGGGCGGCCGGGGGGAACCAG 
GlyLeuProGlyValGlyValArgLeuGlyLeuArgAlaAlaGlyGlyAsnGln 
AlaSerProGlySerAlaSerGlyTrpGly * GlyArgProGlyGlyThrSer 
ProProArgGlyArgArgProAlaGlyValGluGlyGlyArgGlyGluProAla 

CGACATGCGGAGAGCAGCGCAGGCGACTCAGGGCGCTTCCCCCGCAGGTG 
ArgHisAlaGluSerSerAlaGlyAspSerGlyArgPheProArgArg 
AspMetArgArgAlaAlaGlnAlaThrGlnGlyAlaSerProAlaGly 
ThrCysGlyGluGlnArgArgArgLeuArgAlaLeuProProGlnVal 

sequence "1" 38 bases

GTGGCTGTGCTTTGGTTTAAGTTCCTTTTTAACCAGAA 
ValAlaValLeuTrpPheAsnPheLeuPheAsnGlnLys 



sequence "a" 36 bases 

GTGGATGTGACGGGCGCGTACGACACCATCCCCCAG 
ValAspValThrGlyAlaTyrAspThrIleProGln



sequence "β" 182 bases

GTCTCTACCTTGACAGACCTCCAGCCGTACATGCGACAGTTCGTGGCTCACCTG 
ValSerThrLeuThrAspLeuGlnProTyrMetArgGlnPheValAlaHisLeu

CAGGAGACCAGCCCGCTGAGGGATGCCGTCGTCATCGAGCAGAGCTCCTCCCTG 
GlnGluThrSerProLeuArgAspAlaValValIleGluGlnSerSerSerLeu

AATGAGGCCAGCAGTGGCCTCTTCGACGTCTTCCTACGCTTCATGTGCCACCAC 
AsnGluAlaSerSerGlyLeuPheAspValPheLeuArgPheMetCysHisHis

GCCGTGCGCATCAGGGGCAA 
AlaValArgIleArgGlyLys



partial sequence "2" unknown length 

GTGAGCGCACCTGGCCGGAAGTGGAGCCTGTGCCCGGCTGGGGCAGGTGCTGCTGCAG 
Ter 

GGCCGTTGCGTCCACCTCTGCTTCCGTGTGGGGCAGGCGACTGCCAATCCCAAAGGGT 
CAGATGCCACAGGGTGCCCCTCGTCCCATCTGGGGCTGAGCACAAATGCATCTTTCTG 
TGGGAGTGAGGGTGCCTCACAACGGGAGCAGTTTTCTGTGCTATTTTGGTAA.- 



sequence "3" 159 bases 

CCGAAGAAAACATTTCTGTCGTGACTCCTGCGGTGCTTGGGTCGGGACAGCCAGAG 

AlaGluGluAsnIleSerValValThrProAlaValLeuGlySerGlyGlnProGlu

ATGGAGCCACCCCGCAGACCGTCGGGTGTGGGCAGCTTTCCGGTGTCTCCTGGGAGG 
MetGluProProArgArgProSerGlyValGlySerPheProValSerProGlyArg 

GGAGTTGGGCTGGGCCTGTGACTCCTCAGCCTCTGTTTTCCCCCAG 
GlyValGlyLeuGlyLeu * 
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GACAGTCACCAGGGGGGTTGACCGCCGGACTGGGCGTCCCCAGGGTTGACTATAGGA 
CCAGGTGTCCAGGTGCCCTGCAAGTAGAGGGGCTCTCAGAGGCGTCTGGCTGGCATGG 
GTGGACGTGGCCCCGGGCATGGCCTTCTGCGTGTGCTGCCGTGGGTGCCCTGAGCCCT 
CACTGAGTCGGTGGGGGCTTGTGGCTTCCCGTGAGCTTCCCCCTAGTCTGTTGTCTGG 
CTGAGCAAGCCTCCTGAGGGGCTCTCTATTG 



partial sequence of genomic intron (approximately 2.7 kb)

GTGGCTGTGCTTTGGTTTAACTTCCTTTTTAACCAGAAGTGCGTTTGAGCCCCACATT 
TGGTATCAGCTTAGATGAAGGGCCCGGAGGAGGGGCCACGGGACACAGCCAGGGCCAT 
GGCACGGCGCCCACCCATTTGTGCGCACAGTGAGGTGGCCGAGGTGCCGGTGCCTCCA 
GAAAAGCAGCGTGGGGGTGTAGGGGGAGCTCCTGGGGCAGGGAC 
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N-terminal truncated telomerase 



ATCCCGCGCGlTLXXXAX'i m X J K^^ 

MPRAPRCaAVRSLLRSHTRBVLPLATPV 

CG(XGCCTGOGGCcca«Kxxrrtx3a3GcrGC7rc^^ 

RRI,GPQGWRI.VQRaDPAAFRAI,VAQCLVCVPWDARPPPAA 




G G P P B A PTT S V R S Y L PHTVTDAt»RGSGAWGI*LI»RRVGDDV 




ATCCAC^TCGCGGC»CCACGTCCCTGGGACACGCCTTt7rc^ 
STSRPPRPWDTPCPPVYA3TKHPLYSSGDKEQLRPSPLLS 

CTCTCTGAGGCCCAGCCTGACTGGCGCTCGGAGGCTCGTGGAGACCAT^ 
SI»RPSLTGARRI*VBT I PLGSRPWMPGTPRRL P R L PQRTfMQ 



AATGCGGCCC L 11 1T1 I ll^ G CiXiCi - l l> GGAACCACGCGCAGTGCCCCTACGG 
HRPLFLELLGMHAQCPYGV 



ACGCACTGCCCCCTGCGAGCTGCGGTCACCCCAGCAGCCGGTGTCTGTGCCCG 
LKTHCPLRAAVTPAAGVCAR 



GGAGAAGCCCCAGGGCrCTGTGGCCXXrCCCCG 
8KPQGSVAAP3S33TDPRRLVQLLRQHSSPWQVYGPVRAC 

CCTGCCCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCCAGGCACAACGAACG^ 
LRRLVp pGLWGSRHMBaRPLRMTKK.P I SLGKHAKLSLQSL 



GACGTGGAAGATGAGCGTTXTGGGACTGCGCTTGGCrGCGCAGGAG^ 
TWKMSV RDCAWLRRS PG 7GC7PAAEHRLREE I LAKPLHWL 



GATT^GTGTGTACGTCGTCGAGCTGCTCAGGTCT 
MSVYVVELL 



rTCAAAAGAACAGGCT L ' rri ' 1 ' 1 CTACCGGAAGAGTGTCTGGAGCAAGTTGCAAAGCATTGG 
QKMRLPPYRKSVWS'KLQS IG 



AAT- -NNN- -GACACTTCACC^GGGCXXirrTGACCGCCGG^ 

eATGGGTCGACCTGCCCCCOGGCATGCCCTTCTCCUWr^^ 

GCTGAGCAAGCCTCCTGAGGGGCTCTCTATTG— 



Truncated protein 1 



M PRAPRCRAVRSLI.RSHT 



BVLPLATPV 



CGGCGCCTGGGGCCCCAGGGCrGGCGGCrCGTGCAGCGCGGGG 
RRLGPQGWRLVQRGDPAAPRALVAQCLVCVPWDARPPPAA 



RQV3C LK BLVARVLQRLCERGAKNVLA 



GPALLDGAR 




GCTGGTTCACl 
!• V H L I* A 



CALPVI»VAP3CAYQVCGPPLYQLGAATQARPPP 



ACACGCTAGTGGACCCCGAAGGCGTCTGGGATGCGAACGGGCCTGGAACCAT 
HASGPRRRLGCBRAWMBSVR3AGVPLGLPAPGARRRGGSA 

CAGCCGAAGTCrGC LO 1 ' ll^ CCAAGAGGCCCAGGCGTGGCGClTjCCCCrGAGCCGGaCCGGACGCCCGT^ 
SRSLPLPKRPRRGAAPBP3RTPVGQGSWAHPGRTRGPSDR 

TGu'l'l'rC'Iljl tj 'lWlViX J UrCTGCCAGACCCGCCGAAGAAGCCA ^ 1 !Uj A<aGtT3CXTCirTGGCACGCGCCACTCCCAC^ 
GPCVVSPAR PA33ATS L3 3ALSGTRHSH PSVGRQHHAGPP 



CTCTCI C AGGCCCAGCCTIXSACrGGCGCTCGGAGGC'I C GI G GAGACCAT 
SLRPSLTGARRLV2TI P 



rTCCAGGCCCTGGATCCCACGGACTCCCCGCAGGTTGCC^ 
3RPWMPGTPRRLPRLPQRYWQ 



AATGCGGCCCLltjiTlL'ilXatf^Wi'llGGAACCACGCGC^^ 
MRPLPLBLL0MHAQC?Y3*/LLKTHC?LRAAVTPAAGVCAR 



GGAGAAGCCCCAGGGCTCTGTGGCGGCCCC 
EKPQGSVAAP33 



CSTCSCL 1^' ltj CAGCTGCTCCGCCAGCACAGCAGCCCCTGGCAGGTGTACGGCTTCGTGCGGGCC^ 
VQLLRQHSSPWQVYGPVRAC 



CCTGCGCCGGCTtXTnXCCCCAGGCCTCTGGGGC^ 
LRRLVPPGLWGSRHM3RR7 — R»TKK?ISLGKHAKLSLQBL 



GACGTGGAAGATGAGCGTCCGGGACTGCGCTTGCXrTTX:GCAGCAGC^ 
THKMSVRDCAWLRRSPGV3CVPAA3KRLREEILAKPLHML 



GATGAGTGTGTACGTCGTCGAGCTGCTCAGGTU"I"1'1 <- i i i i. ATGTCACGGAGACCAt. j * . 1 ."^AAAAGAACAGGCTL I CTACCGGAAGAGTGTCTGGAGCAAGTTGCAAAGCATTGG 
MSVYVVBC*LRS??YVT3???QXNRL?PYRXSVW5KLQStG 



AATCAGACAGCAC7TGAAGAGGGTGCAGCTGCGGGAG 
IRQHLKRVQLR2 



7TTTCGCAAGCAGAGGTCAGGCAGCATC:JGGAAGCCAGG^ 

SEA3Y3Q3REARPALLTSRLRFI PKPD 



GTGGCTGTtlCTTTtJGTTTAACTTCCTTTTTAACCAGAA 
VAVL'rfFTPLPNQK 

CGGGCTGCGGCCGATTGTGAACATGGACTACGTCGTGGGAGCCAGAACGTTCCGC^ 
GLRPIVNMDYVVGARTPRR3XR PSVSFRG* 



4 
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Truncated protein 2 



111 



Vii 



hJ 



RCRAVRSLLRS 



TACCGCGAGGTGCTGCCGCTGGCCACGTTCGTG 
TRSVLPLATPV 



RRI,GPQGWRLVGRGDPAAFRALVAQ.CLVCVPWDARPPPAA 



S P R Q V S C 



CCCGAGTGCTGCAGAGGCTGTGCGAGCGCGGCGCGAAGAACGt^^ 
VARVLQRLCBRGAKMVLAPG 



PALL 



CGGO^CCCCCayU^CTR^CACCAGCGTGCGCAGCTA 
GGPPBAPTTSVRSYLPMTVTDALRGSGAWGLLLRRVGDDV 

GCTGGTTCACCTGCIGGCACGCIGCGCGCTCTTTGTGCT^ 
LVHLLARCAL FVLVAPSCAYQVCGPPLYQLGAATQAR P PP 



ACACGCTAGTGGACCCCGAAGGCGTCTGGGATGCGAACGGGCCT 
HASGPRRRLGCBRAWNHS 



VRSAGVPLGLPAPGAR 



CAGCCGAAGTCTGCCGTTGCCCAAGAGGCCCAGGCGTGGCGCTGCCCCTGAGCCG 
3RSLPLPKRPRRGAAPBPBRTPVGQGSWAHPGRTRGPSDR 




CCTTGTCCCCCGGTGTACGCCGAGACCAAGCACTTCCTCTA 
STSRPPRPWDTPCPPVYA3TKHPLYSSGDKEQLRPSFLLS 

CltTICTGAGGCCCAGCCTGACTGGCGCTCGGAGGCTCGT^ 
SLRPSLTGARRLV3TIFLGSRPWMPGTPRRLPRLPQRYWQ 

CGCTGCGAGCTGCCGTCACCCC 
KTHCPLRAAVTPA 

GGAGAAGCCCCAGGGCT^TGTGGCGGCCCCCGAGGAGGAGGACACAGACCCCCGTCGCCTG 
BKPQGSVAAPSES3TDPRRLVQLLRQHSSPWQVYGPVRAC 

ccrrgctccggctggtgcccccaggcctctggggctccaggcacaacgaacg^ 
l'rrl'vppglwgsrhmsrrflrmtkkpislgkhaklslqel 

GACGTGGAA(^TGAGCGTGCGGGACTCX:GCrrGGC-rGCGC^ 
TWKNSVRDCAMLRRS PGVGCVPAAEHRLRES ILAKPLHWL 



GATGAGTGTGTACGTCGTCGAGCTGCTCAGGTCTTT 
MSVYVV3LLRSP 



rTTATCTCACGGAC^CCACGrrrCAAAAGAACAGGCTCTTTTTCTACC 

YVTSTTPQKMRLPP'YRKS V W S KLQS I G 



AATCAGACACXLACTTCLAACLACK3GTG 

iaQHLKRVQLRBLSBASVRQHREARPALLTSRLRP I PKPD 

CGGGCTGCGGCCGATTGTGAAC^TGGACTACCTCGTGGGAG^ 
GL*R? ivsimDYVVGARTPRRBKRABRLTSRVKAL PSVLMYS 

GCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTCTGTGCTGGGCCrG^ 
RARRPGLLGASVLGLDDIHRAWRTPVLRVRAQDPPPSLYP 

TGTCAAGGTGGATGTGACGGGCGCGTACGACACCATCCCCCAGGACAGGCTCA 
VKVDVTGAYDTI PQ DRLT3VIAS I IKPQNTYCVRRYAVVQ 

GAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGCCAC 
KAAHGHVRKAPK5H 

GTCCTACGTCCAGTG 
V L R P V 

ccagoggatcccgcagcgctccatcctctccacgcii^il: 

PGDp W AGLHPLHAALQPVLRRHGEQAVCGDSAGRAAPAPVG 
ACACCT<^CCTCACCCACGCGAAAACCTTCCTCAGGACCCTOTrCCGAGGTCT 
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Reference protein 



ATGCCGCGCGCTCCCCGCTGCCGAGCCGTGCGCTCCCTGCTGCGCAGCCACTACCGCGAG 60

MetProArgAlaProArgCysArgAlaValArgSerLeuLeuArgSerHisTyrArgGlu 20

GTGCTGCCGCTGGCCACGTTCGTGCGGCGCCTGGGGCCCCAGGGCTGGCGGCTGGTGCAG 120 

ValLeuProLeuAlaThrPheValArgArgLeuGlyProGlnGlyTrpArgLeuValGln 40

CGCGGGGACCCGGCGGCTTTCCGCGCGCTGGTGGCCCAGTGCCTGGTGTGCGTGCCCTGG 180 

ArgGlyAspProAlaAlaPheArgAlaLeuValAlaGlnCysLeuValCysValProTrp 60 

GACGCACGGCCGCCCCCCGCCGCCCCCTCCTTCCGCCAGGTGTCCTGCCTGAAGGAGCTG 240 

AspAlaArgProProProAlaAlaProSerPheArgGlnValSerCysLeuLysGluLeu 80 

GTGGCCCGAGTGCTGCAGAGGCTGTGCGAGCGCGGCGCGAAGAACGTGCTGGCCTTCGGC 300 

ValAlaArgValLeuGlnArgLeuCysGluArgGlyAlaLysAsnValLeuAlaPheGly 100 

TTCGCGCTGCTGGACGGGGCCCGCGGGGGCCCCCCCGAGGCCTTCACCACCAGCGTGCGC 360

PheAlaLeuLeuAspGlyAlaArgGlyGlyProProGluAlaPheThrThrSerValArg 120 

AGCTACCTGCCCAACACGGTGACCGACGCACTGCGGGGGAGCGGGGCGTGGGGGCTGCTG 420 

SerTyrLeuProAsnThrValThrAspAlaLeuArgGlySerGlyAlaTrpGlyLeuLeu 140 

TTGCGCCGCGTGGGCGACGACGTGCTGGTTCACCTGCTGGCACGCTGCGCGCTCTTTGTG 480

LeuArgArgValGlyAspAspValLeuValHisLeuLeuAlaArgCysAlaLeuPheVal 160 

CTGGTGGCTCCCAGCTGCGCCTACCAGGTGTGCGGGCCGCCGCTGTACCAGCTCGGCGCT 540

LeuValAlaProSerCysAlaTyrGlnValCysGlyProProLeuTyrGlnLeuGlyAla 180 

GCCACTCAGGCCCGGCCCCCGCCACACGCTAGTGGACCCCGAAGGCGTCTGGGATGCGAA 600

AlaThrGlnAlaArgProProProHisAlaSerGlyProArgArgArgLeuGlyCysGlu 200 

CGGGCCTGGAACCATAGCGTCAGGGAGGCCGGGGTCCCCCTGGGCCTGCCAGCCCCGGGT 660

ArgAlaTrpAsnHisSerValArgGluAlaGlyValProLeuGlyLeuProAlaProGly 220 

GCGAGGAGGCGCGGGGGCAGTGCCAGCCGAAGTCTGCCGTTGCCCAAGAGGCCCAGGCGT 720 

AlaArgArgArgGlyGlySerAlaSerArgSerLeuProLeuProLysArgProArgArg 240

GGCGCTGCCCCTGAGCCGGAGCGGACGCCCGTTGGGCAGGGGTCCTGGGCCCACCCGGGC 780

GlyAlaAlaProGluProGluArgThrProValGlyGlnGlySerTrpAlaHisProGly 260

AGGACGCGTGGACCGAGTGACCGTGGTTTCTGTGTGGTGTCACCTGCCAGACCCGCCGAA 840

ArgThrArgGlyProSerAspArgGlyPheCysValValSerProAlaArgProAlaGlu 280

GAAGCCACCTCTTTGGAGGGTGCGCTCTCTGGCACGCGCCACTCCCACCCATCCGTGGGC 900 

GluAlaThrSerLeuGluGlyAlaLeuSerGlyThrArgHisSerHisProSerValGly 300

CGCCAGCACCACGCGGGCCCCCCATCCACATCGCGGCCACCACGTCCCTGGGACACGCCT 960

ArgGlnHisHisAlaGlyProProSerThrSerArgProProArgProTrpAspThrPro 320

TGTCCCCCGGTGTACGCCGAGACCAAGCACTTCCTCTACTCCTCAGGCGACAAGGAGCAG 1020 

CysProProValTyrAlaGluThrLysHisPheLeuTyrSerSerGlyAspLysGluGln 340

CTGCGGCCCTCCTTCCTACTCAGCTCTCTGAGGCCCAGCCTGACTGGCGCTCGGAGGCTC 1080

LeuArgProSerPheLeuLeuSerSerLeuArgProSerLeuThrGlyAlaArgArgLeu 360

GTGGAGACCATCTTTCTGGGTTCCAGGCCCTGGATGCCAGGGACTCCCCGCAGGTTGCCC 1140

ValGluThrIlePheLeuGlySerArgProTrpMetProGlyThrProArgArgLeuPro 380

CGCCTGCCCCAGCGCTACTGGCAAATGCGGCCCCTGTTTCTGGAGCTGCTTGGGAACCAC 1200

ArgLeuProGlnArgTyrTrpGlnMetArgProLeuPheLeuGluLeuLeuGlyAsnHis 400

GCGCAGTGCCCCTACGGGGTGCTCCTCAAGACGCACTGCCCGCTGCGAGCTGCGGTCACC 1260 

AlaGlnCysProTyrGlyValLeuLeuLysThrHisCysProLeuArgAlaAlaValThr 420 
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1320 
440 



1380 
460 



CCAGCAGCCGGTGTCTGTGCCCGGGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCGAGGAG 
ProAlaAlaGlyValCysAlaArgGluLysProGlnGlySerValAlaAlaProGluGlu 

GAGGACACAGACCCCCGTCGCCTGGTGCAGCTGCTCCGCCAGCACAGCAGCCCCTGGCAG
GluAspThrAspProArgArgLeuValGlnLeuLeuArgGlnHisSerSerProTrpGln 

GTGTACGGCTTCGTGCGGGCCTGCCTGCGCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCC 1440 
ValTyrGlyPheValArgAlaCysLeuArgArgLeuValProProGlyLeuTrpGlySer 480 

AGGCACAACGAACGCCGCTTCCTCAGGAACACCAAGAAGTTCATCTCCCTGGGGAAGCAT 1500
ArgHisAsnGluArgArgPheLeuArgAsnThrLysLysPheIleSerLeuGlyLysHis 500

GCCAAGCTCTCGCTGCAGGAGCTGACGTGGAAGATGAGCGTGCGGGGCTGCGCTTGGCTG 
AlaLysLeuSerLeuGlnGluLeuThrTrpLysMetSerValArgAspCysAlaTrpLeu



1560 
520 




CTGGCCAAGTTCCTGCACTGGCTGATGAGTGTGTACGTCGTCGAGCTGCTCAGGTCTTTC 1680

LeuAlaLysPheLeuHisTrpLeuMetSerValTyrValValGluLeuLeuArgSerPhe 560

TTTTATGTCACGGAGACCACGTTTCAAAAGAACAGGCTCTTTTTCTACCGGAAGAGTGTC 1740 

PheTyrValThrGluThrThrPheGlnLysAsnArgLeuPhePheTyrArgLysSerVal 580

TGGAGCAAGTTGCAAAGCATTGGAATCAGACAGCACTTGAAGAGGGTGCAGCTGCGGGAG 1800 

TrpSerLysLeuGlnSerIleGlyIleArgGlnHisLeuLysArgValGlnLeuArgGlu 600

CTGTCGGAAGCAGAGGTCAGGCAGCATCGGGAAGCCAGGCCCGCCCTGCTGACGTCCAGA 1860 

LeuSerGluAlaGluValArgGlnHisArgGluAlaArgProAlaLeuLeuThrSerArg 620

CTCCGCTTCATCCCCAAGCCTGACGGGCTGCGGCCGATTGTGAACATGGACTACGTCGTC 1920 

LeuArgPheIleProLysProAspGlyLeuArgProIleValAsnMetAspTyrValVal 640

GGAGCCAGAACGTTCCGCAGAGAAAAGAGGGCCGAGCGTCTCACCTCGAGGGTGAAGGCA 1980 

GlyAlaArgThrPheArgArgGluLysArgAlaGluArgLeuThrSerArgValLysAla 660 

CTGTTCAGCGTGCTCAACTACGAGCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTCTGTG 2040 

LeuPheSerValLeuAsnTyrGluArgAlaArgArgProGlyLeuLeuGlyAlaSerVal 680

CTGGGCCTGGACGATATCCACAGGGCCTGGCGCACCTTCGTGCTGCGTGTGCGGGCCCAG 2100 

LeuGlyLeuAspAspIleHisArgAlaTrpArgThrPheValLeuArgValArgAlaGln 700

GACCCGCCGCCTGAGCTGTACTTTGTCAAGGTGGATGTGACGGGCGCGTACGACACCATC 2160 

AspProProProGluLeuTyrPheValLysValAspValThrGlyAlaTyrAspThrIle 720

CCCCAGGACAGGCTCACGGAGGTCATCGCCAGCATCATCAAACCCCAGAACACGTACTGC 2220 

ProGlnAspArgLeuThrGluValIleAlaSerIleIleLysProGlnAsnThrTyrCys 740

GTGCGTCGGTATGCCGTGGTCCAGAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAG 2280 

ValArgArgTyrAlaValValGlnLysAlaAlaHisGlyHisValArgLysAlaPheLys 760 

AGCCACGTCTCTACCTTGACAGACCTCCAGCCGTACATGCGACAGTTCGTGGCTCACCTG 2340 

SerHisValSerThrLeuThrAspLeuGlnProTyrMetArgGlnPheValAlaHisLeu 780

CAGGAGACCAGCCCGCTGAGGGATGCCGTCGTCATCGAGCAGAGCTCCTCCCTGAATGAG 2400 

GlnGluThrSerProLeuArgAspAlaValVallleGluGlnSerSerSerLeuAsnGlu 800 

GCCAGCAGTGGCCTCTTCGACGTCTTCCTACGCTTCATGTGCCACCACGCCGTGCGCATC 2460 

AlaSerSerGlyLeuPheAspValPheLeuArgPheMetCysHisHisAlaValArgIle 820

AGGGGCAAGTCCTACGTCCAGTGCCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTG 2520 

ArgGlyLysSerTyrValGlnCysGlnGlylleProGlnGlySerlleLeuSerThrLeu 840 

CTCTGCAGCCTGTGCTACGGCGACATGGAGAACAAGCTGTTTGCGGGGATTCGGCGGGAC 2580 

LeuCysSerLeuCysTyrGlyAspMetGluAsnLysLeuPheAlaGlylleArgArgAsp 860 

GGGCTGCTCCTGCGTTTGGTGGATGATTTCTTGTTGGTGACACCTCACCTCACCCACGCG 2640 

FIG. 11E




GlyLeuLeuLeuArgLeuValAspAspPheLeuLeuValThrProHisLeuThrHisAla 880 

AAAACCTTCCTCAGGACCCTGGTCCGAGGTGTCCCTGAGTATGGCTGCGTGGTGAACTTG 2700 

LysThrPheLeuArgThrLeuValArgGlyValProGluTyrGlyCysValValAsnLeu 900 

CGGAAGACAGTGGTGAACTTCCCTGTAGAAGACGAGGCCCTGGGTGGCACGGCTTTTGTT 2760

ArgLysThrValValAsnPheProValGluAspGluAlaLeuGlyGlyThrAlaPheVal 920

CAGATGCCGGCCCACGGCCTATTCCCCTGGTGCGGCCTGCTGCTGGATACCCGGACCCTG 2820 

GlnMetProAlaHisGlyLeuPheProTrpCysGlyLeuLeuLeuAspThrArgThrLeu 940

GAGGTGCAGAGCGACTACTCCAGCTATGCCCGGACCTCCATCAGAGCCAGTCTCACCTTC 2880 

GluValGlnSerAspTyrSerSerTyrAlaArgThrSerlleArgAlaSerLeuThrPhe 960 

AACCGCGGCTTCAAGGCTGGGAGGAACATGCGTCGCAAACTCTTTGGGGTCTTGCGGCTG 2940

AsnArgGlyPheLysAlaGlyArgAsnMetArgArgLysLeuPheGlyValLeuArgLeu 980 

AAGTGTCACAGCCTGTTTCTGGATTTGCAGGTGAACAGCCTCCAGACGGTGTGCACCAAC 3000

LysCysHisSerLeuPheLeuAspLeuGlnValAsnSerLeuGlnThrValCysThrAsn 1000 

ATCTACAAGATCCTCCTGCTGCAGGCGTACAGGTTTCACGCATGTGTGCTGCAGCTCCCA 3060 

IleTyrLysIleLeuLeuLeuGlnAlaTyrArgPheHisAlaCysValLeuGlnLeuPro 1020 

TTTCATCAGCAAGTTTGGAAGAACCCCACATTTTTCCTGCGCGTCATCTCTGACACGGCC 3120 

PheHisGlnGlnValTrpLysAsnProThrPhePheLeuArgValIleSerAspThrAla 1040

TCCCTCTGCTACTCCATCCTGAAAGCCAAGAACGCAGGGATGTCGCTGGGGGCCAAGGGC 3180 

SerLeuCysTyrSerIleLeuLysAlaLysAsnAlaGlyMetSerLeuGlyAlaLysGly 1060

GCCGCCGGCCCTCTGCCCTCCGAGGCCGTGCAGTGGCTGTGCCACCAAGCATTCCTGCTC 3240

AlaAlaGlyProLeuProSerGluAlaValGlnTrpLeuCysHisGlnAlaPheLeuLeu 1080 

AAGCTGACTCGACACCGTGTCACCTACGTGCCACTCCTGGGGTCACTCAGGACAGCCCAG 3300

LysLeuThrArgHisArgValThrTyrValProLeuLeuGlySerLeuArgThrAlaGln 1100

ACGCAGCTGAGTCGGAAGCTCCCGGGGACGACGCTGACTGCCCTGGAGGCCGCAGCCAAC 3360

ThrGlnLeuSerArgLysLeuProGlyThrThrLeuThrAlaLeuGluAlaAlaAlaAsn 1120

CCGGCACTGCCCTCAGACTTCAAGACCATCCTGGAC 3420

ProAlaLeuProSerAspPheLysThrIleLeuAsp 1132
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Truncated protein 3 



CGGCGCCTGGGGCCCCAGGGCTGGCGGCTGGTGCAGCGCGGGCACCCGGCGG L I ' l llL( J CGaxrreGTGGCCCAGTGCL M Itk.lXVl' ^ 

RRLGPQGWRLVQRGDPAAPRALVAQCLVCVPWDARPPPAA 

CCC C T C CTT C CGCCAGGTGTCCTGCCTGAAGGAG l ' ira jrG^ 
PSPRQVSCLKBLVARVLQRLCBRGAKNVLAPGFALLDGAR 



GGPPBAPTTSVR 



YLPM TVTDALRGSGAWGLLLRRVGDDV 



ACACGCTAGTGGACCCCGAAGGCGTCTGGGATGCGAACGGGCCTGGAACCATAG 
HASG PRRRLGCBRAWMHSVRSAGVPLGLPAPGARRRGGSA 

CAGCCGAAGTCTGCCGTTGCCCAAGAGGCCCAGGCGTGGCGCTGCCCCTGAGCCGGAG 
SRSLPLPKRPRRGAAPSPBRTPVGQGSWAHPGRTRGPSDR 

TG UlTllliaVlV^l^ltJ lCCTGCCaGACCC^ 
GPCVVSPARPABBATSL3CALSGTRHSHPSVGRQKHAGPP 



CGCCTTGTCCCCCGGTGTACGCCGAGACCAAGCACTTCCTCTACTCCTCAGGCGACAAG 
STSRPPRPWDTPCPPVYA37KHPLYSSGDICEQLRPSPLLS 



CTCrcn^AGGCCCAGCCTGACTGGCGCrCGGAGGCTCGTGGAG^ 
SLRPSLTGARRLVBTIPLGSRPWMPGTPRRLPRLPQRYWQ 



AATGCGGCCCCTG 
M R P L ? L 



ACCACC^GCAGTGCCCCTACGGGOT:^:^ 
LLGSHAQCPYGVLLKTHCPLRAAVTPAAGVCAR 



GGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCGAGGAGGAGGACACAGACCCCCj 
BXPQGSVAAPSESDTDPRRLVQLLRQHSSPWQVYGFVRAC 

CCTGCGCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCCAGGC^ 
LRRLVPPGLWGSRHMERRPLRMTKKPISLGKHAKLSLQEL 

GACGTGGAAGATGAGCGTGCGGGACTGCGCTTCXXTrGCGCAGGAG^ 
TWKMSVRDCAWLRRS PGVGCVPAASHRLR3E ILAKPLKWL 

GATGAGTGTGTACGTCGTCGAGCTGCTCAGGTCITTCTTTT^ 
MSVYVVBLLRSPPYVTBTTPOKNRLFPYRKSVWSKLQSIG 

AATCAGACAGCACTTGAAGAGGGTGCAGCTGCGGGAGCTnTC 
IRQHLKRVQLRELS3A3VRQHREARPALLTSRLRFIPKPD 

CGGGCTGCGGCCGATTGTGAACATGGACTACGTCGTGGGAGCCAGAACGTTCCG 
GLRPIVMMDYVVGARTPRR3KRASRLTSRVKALPSVLNY3 

GCGGGCGCGGCGCCCCGGCCTTCCTTGGGCGCCTCTGTGCTGGG^ 
RARRPGLLGASVLGL0DIHRAWR7PVI.RVRAQDPPPEt.YP 

TGTCAAGGTGGATGTGACGGGCGCGTACGACACCATCCCCCAGGACAGGCTCACGGAGGTCAT 
VKVDVTGAYOTI PQDRLT3VIASI IKPQNTYCVRRYAVVQ 

GAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGCCACCTCTCTACCT^ 
KAAHGHVRKAPKSHVSTLTDLQPYMRQPVAHLQETSPLRD 

TGCCGTCGTt^TCGAGCAGAGCTCCTCCCTGAATGAGGCt^GCAGTGGCCT 
AVVIEQSSSLMBASSGLPDVPLRPMCHHAVRIRGKSYVQC 

CCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTGCTCTGCAGCCTG^ 
QGIPQGSrLSTLLCSLCYGDMSMKLPAGtRRDGLLLRLVD 

TGATTTCTTGTTCGTGACACCTCACCTCACCCACGCGAAAACCTTC 
DPLLVTPHLTHAKTPLRTLVRGVP3 YGCVVNLRKTVVNPP 

TGTAGAAGACGAGGCCCTGGGTGGCACGGCTTTTGTTC^GATGCCGG^ 
VSDEALGGTAPVG.MPAHGLPPWCGLLLDTRTLEVQSDYSR 

GTGAGCGCACCTGGCCGGAAGTGGAGCCTGTGCCCGGCTGGGGCAG 



TGCCACAGGGTGCCCCTCCTCCCATCTGGGGCTGAG^ 



rTATTTTGGTAA 
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Altered C-terminus protein 



ATCCCGCGCGCl lL L ll^ i ljU J U U aXXJIXX rar^ 

H P RAPRCRAVRSttLRSHTR SVL P L A T P V 



CCCC 
P 3 



CCTGCCTGAAGGAGCTGGTGGCCCGACTCCItXSVGACGC^^ 
QVSCLKBLVARVLQRLCBRGAKHVLAPGPALLDGAR 



GGPPSAFTTSVRSYLPMTVTQALRGSGAWGLLI. 



R V G D D V 



LVHLLARCALFVLVAPSCAYQVCGPPLYQLGAATQARPPP 

ACACGCTAGTGGACCCCGAAGGCGTCTGGGATGCGAACG^ 
HASGPRRRLGCBRAWU33V23AGVPLGLPAPGARRRGGSA 




ccctctctogcacgcgccactcccacccatccgtcxx^ 

alsgtrhshpsvgrqhhagpp 



ATC&CATCGCGGCCACCACGTCCCTGGGACACGCCT^ 
STSRPPRPWDTPCP?VYA37!Ca?LYSSGDKBgLRPSPLLS 



CTCTCTGAGGCCCAGCCTGACTGGCGCTCGGAGGCTCGTGGAGACC^ 
SLRPStTGARRLVSTIPLGSRPWNPGTPRRLPRLPQRYWQ 



m 

I'M 



AATGCGGCCCClUlTl U IXjGAGCTGCTTGGGAACCACGCGCAGTG 
MR'PLPLSLLGNHAQCPYGVLiKTHCPLRAAVTPAAGVCAR 

GGAGAAGCCCCAGGGC7CTGTGGCGGCCCCCGAGGAGGAGGAGA(^ 
EKPQGSVAAP33S3T0PRR1VQLLRQHSSPWQ7YGPVRAC 



CCTCCGCCGGCTGCTGCCCC^GGCCTCTGGGGCTCCA^^ 
LRRLVPPGLWGSRHM3RR 



CCTC^CGAJkCACCAAGAACrrTCATCTCCCTGGGGAAGCATGCCAAGCT 
wRMTKXPISLGKKAKLSLQSL 



GACGTOGAAGATGAGCGTGCGGGACTGCGCTTtXXTrOCSCAGCAG^ 
TWXMSVR3CAWLRR5PGV3ZVPAASHR 



rTGCGTGAGGAGATCCTGGCCAAGTTCCTGCACTGGCT 
CREEILAXFLHML 



GATGAGTGTGTACGTCGTCGAGCrGCTCAGGTCTTTCTTTTAT^ 
HSVYVVBLLRS??YVT37T?33CJIRLPPYRKSVWSKLQSIG 



AATCAGACAGCACTTGAACyUXXTTGCAGCTOCGGGAGCTGTCG^^ 
IRQHLICRVQLRELS3A3VR33RSAR?ALLTSRLRPr?ICPD 

CGGGCTGCGGCCGAT7GTGAACATGGACTACGTCGTGGGAGCCAGAAOT 
GLRPIVMMDYVVGARTPRR3X3A3RLTSRVKALPSVLNYE 



GCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTXrrGTXKTrGGGCCTGGA 
RARRPGLLGASVLGLOSiaSAURTPVLRyRAQOPPPSLYP 



TGTCAAGCrrGGATGTGACGGGCGCGTACGACACCATCCCCCAGGACAG^ 
VKVDVTGAYDT I PQDR-73 7 IAS I IKPQNTYCVRRYAVVQ 



GAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAC^CACGTCTC7ACC^^ 
KAAHGHVRKAPKSHVSTL73L0PYMRQPVAHLQ3TSPLRD 



TGCCGTCGTCATCCAGCACAGCTCCTCCCTCAATGAGCCCAGCAGTGGCC^^ 
AVVIBQSSSLM3ASSGL?3V?LRPMCHHAVRIRGKSYVQC 



CCAGGGGATCCCGCAGGGCTCCATCCTCirCACGCTGC7CTGCAG^ 1 I, I ' i ' ltj CGGGGATTCGGCGGGACGGGCTGCTCCTGC U IT 1 U. lli GA 

Q G I PQGS ILSTLLCSLCYG3M3MKLPAG IRRDGLLLRLVD 

ACACCTCACCTCACCCACCCGAAAAC 
V7PHLTHAKTPLR 

TCTAGAAGACGAGGCCCTTXXrTGGCACGGCTTTTGTTCAG^ 
VBOBALGGTAPVQMPAHGLPPWCGLLLDTRTLBVQSDYSS 

CTATGCCCGGACC7^CATTLAGAGCCAGTC7CACCTTCAACCGCGGCTTCAAGGCTO 
YARTSIRASLTPMRGPKA3RMMRRKLPGVLRLKCHSLPI.D 

TTTGCAGGTCAACAGCCTCCAGACGGTGTGCACCAACATCTACAAGATC 
LQVH5LQ7VCTN I Y K I LLLQAYRPHACVLQLP FHQQVWKN 

CCCCACATTTT7CCTGCGCG7CATC7rCTGACaCGGCCTCCCTCrGCT 
P7P?LRVr5DTASLCYS ILKAKMAB 

! 

CCGAAGAAAACATT7C7GTCGTGACTCC7GCGGTGCTTGGGTC 
3BWILVV7PAVLGS 



GGGACAGCCAGAGATGGAGCCACCCCGCAGACCGTCGGGTGTGGGCAGCT^ 
GQPSMHPPRRPSGVGSPPV3 



TCCTGGGAGGGGAGTTGGGCTGGGCCTGTGACTCCTCAGCCTCTC^ 
PGRGVGLGL * 
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Protein that lacks moti 



R L G 



RAP 

CCCAGTGCCTGGTGTCCGTGCCCTGGGACGCACGGCCGCCCCCCGCCGC 
GWRLVQRGDPAAFRALVAQCLVCVPWDARPPPAA 




JCGCGTGGGCGACGACGT 
R V G D D V 

G C -XX ^ l-lt J UZCTGCTGGCACGCTXSaXX X. 'i' C l T l U 1 UL 1 U» I G GCTCCCAGCrGCGCCTACCAGGTGTGCGGGCCGCCGCTGTACCAGCT 
LVHLLARCALFVLVAPSCAYQVCGPPLYQLGAATQARPPP 



ACACGCTAGTGGACCCCGAAGGCGTCTGGGAT 
HASGPRRRLGCSRAWMH 



GVPLGLPA 



A R R R 



CAGCCGAAGTCrGCCGTTGCCCAAGAGGCCCAGGCGTGGCGCT^ 
SRSLPLPKRPRR<3AA pB?3aTPVG< 3 GSMAHPGRTRaPSDR 

TCUlTlLUu i l. UA .ll.lLACCTOCCACACCCGCCS^^ 
GPCVVSPARPA3SATSLBGALSGTRHSHPSVGRQHHAGPP 

ATCCACATCGCGGCCACCACGTCCCTGGGACACGCCTTGTCCCCCGGT^ 
STSRPPRPV#DTPCPPVYA3TKHPLYSSGDKBQLRPSPLI.S 



CTCTCTtauSGCCCAGCCTGACTGGCGCTCGGAGGC^ ».an. 
SLRPSLTGARRLVSTI PLGSRP WMPGTPR 



RLPRLPQRYWQ 

:CACGCGCAGTGCCCCTACGGGGTGCTCCTCAAGACGCACTGC^ 



Q C 



VLLKTHCPLRAA 



A A G V C A 



GGACU^AGCCCCAGGGCTCTXTrGGCGGCCCCCGAGGAGGA 

BKPQGSVAAP E32DTQ PRRLVQLLRQHSSPWQVYGPVRAC 

CCTGCGCCGGCTGGTGCCCCCAGGCCTCTGGGCX7^ 

L RRL*VP PGLWGSRHMS R 3 ?L.RMTKK? I S LGKHAKLS LQ3 L 



GACGTCK^GATGAGCGTGCGGGACTGCGCTTGGCTGCGCAGGAG^ 
TMKMSVR0CAMLRR3PGV; 



rTXTTTCCGGCCGCAGAGCACCGTCTGCGTGAGGAGATCCTGGCCAAGTTCC^ 
VPAASHRLREE ILAKFLHWL 



GATGAGTGTGTACGTCCTrCGAGCTGCTCAGGTCTrTtrrTTTATGTCACG 
MSVYVVBL*LRS»?Y7TSTT?QKMRLPPYRKSVWSKLQSIG 

AATCAGACAGCACTTGAAGAGGGTGCAGCTCCGGGAGCTGTCGGAAGG 
I RQHLKRVQLRSLS3ASVR-3aRBARPALLTSRLRPI PKPD 

CGGGCT"GCGGCCGAT" T *G7 1 GAACATGGACTACGTCGTGGGAGCCAGAA 
OL*RPl"yMM0YVyGARTPRR3KRAERLTSRVKALPSVLHYa 

GCGCOCGCGGCGCTCCOGC^CCTCGGCSCCTl'ltji rc 

rarrpgllgasvlgldo:hrawrt?vlrvraqdpppsi*yp 

gacaggctcacggaggtcatcgccagcatcatcaaaccccagaacacgtac^^ 

0rlt3viasi ikpqmtycvrryavvq 

CAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGCCACGTCTCT^ 
KAAHGHVRKAPXSHVST^TDLQPYMRQFVAHLQETSPLRD 

TCCCGTCGT^TCC^GCAGAGCTCCTCCCTXIAATGAGGCCAG 
AVVIEQSSSLNBASSGLPOVPLRPMCHHAVRIRGXSYVQC 

CCAGOOGATCCCGCAGGGcicCATCCTCTCGK^ 
Q G I PQG5 IL5TLLC5LCYG3MEMKLPAGIRRDGLLLRLV0 



TGTCAAG 
V K 



1ACACCTCACCTCACCCACGCGAAAACCTTCCTCAGGACC 
TPHLTHAKTPLRT 



TCCGAGGTGTCCCTGAGTATGGCTGCGTGGTGAACTTGCGGAAGACAGTGGTGAA 

RGVPEYGCVVNLRKTVVNPP 



TCTAGAAGACGAGGCCCTGGGTOSCACGGCTTTTG^ 
VBDBALGGTAPVQMPAHGLPPMCGLLLDTRTLEVQSDYSS 

CTATGCCCGGACCnrCATCACAGCCAGTCrCACCTTCAACCG^ 
YART5IRASLTPMRGPKAGRMMRRKL7GVLRLKCHSI-PL-D 

TTTGCAGGTGAACAGCCTC^GACGGTGTGCACCAACATCTACAAGAT^ 
LQVMSLQTVCTMI Y K I LLLQAYRFHACVLQLPFHQQVWKN 

CCCCA<^TTmCCTGCGCGTCATCTCTGACACGGC^ 
PTPPLRVISDTASLCYSILKAICHAGNSLGAKGAAGPLPSB 



GGCCGTGCAGTGGCTGTGCCACCAAGCATTCCTGCTCAAGCTTIACTCGACAC 
AVQWLCHQAFLLKLTRHR 



tCCTACGTGCCACTCCTGGGGTCACTCAGGACAGCCCAGACGCAGCTGAGTCGGAAGCTCCC 
YVPLLGSLRTAQTQLSRKLP 



GGGGACGACGCTC^CirXTCCTGGAGGCCGCAGCCAACCCCW^ 
GTTLTALEAAASPALPSDPKTI L D 

CTGTCACGCCGGGCTCTACGTCCCAGGGAGGGAGGGGCGGCCCACACCCAGGCCCO 

GAGTGTCCGGCTGAGGCCTGAGCGAGTGTCC^GCCAAGGGCTGAGTGTCC^ 

CAGGAGCCCGGCTTCCACTCCCCACATAGGAATAGTCCATCCCCAG 

GGACCCTGGGAGCTCTGGGAATTTGGAGTGACCAAAGGTGTGCCCTGTAC^ 

AATACTGAATATATGAGTTTTTCAGTTTTGA 



FIG. 11I



ated protein that lacks 



f A 



PRAPRCRAVRSLLRSHTRBVLPI.ATPV 




LVHLLARCALPVLVAPSCAYQVCGPPLYQLGAATQAR 



ACACGCTAGTGGACCCCGAAGGCGTCTGGGA' 



:CCIT3GGCCTGCC»GCCCCGGGTGCGAGGAGGCGCGa 



HASGPRRRLGCBRAWlfHSVRBAGVPLGLPAPGA 



R R G G S A 



RSLPLPKRPRRGAAP3 



:CCACCCGGGCAGGACGCGTGGACCGAGTGACCG 
3RTPVGQGSWAHPGRTRGPS0R 

^CGCCGAAGAAGCCACCTCITTGGAOGGTGCGCTCTCTGGCACGCGCCACTCCCAC^ 
G P C V V S p ARPABSATSLBGALSGTRHSHPSVGRQHHAGPP 

ATCCACATCGCGGCCACCACwTCCCTGGGACACGCCTTGTCCCCCGGTff 
STSRPPRPWDTPCPPVYABTKHPLYSSGOKEQLRPSPIiLS 



CTCTCTGAGGCCCAGCCTGACTCGCGCTCGGAGGC'l'Ltj lOGAGACCA i n.^ 
SLRPSLTGARRLV3TI PL 



SRPWM PGTPRRLPRLPQRYWQ 



CCCrACGa^'rGCrCCrCAAGACGCACTGCCCGCTGCGAGC^ 
HAQCPYGVLLKTHCPLRAAVTPAAGVCAR 

GGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCGAGGAGGAGGACAC^ 
EKPQGSVAAP333DTDPRRI.VQLLRQHSSPWQVYGPVRAC 

CCTTX^CGGCTXXrnKCCCCAGGCCTCTOGGa 
LRRL*V??3LMGSRH!l3aR?^RMTKKP:SLGKHAKLSLQ3L 

rrCTTCCGGCCGCAGAGCACCGTCTGCGTGAGGAGATCCTGGCC^ 
7PAAEHRLRBE ILAKPLHWL 



GACGTGGAAGATGAGCGTGCGGGACTGCGCTTGGCTGCGCAGGAGCCCAGGGGTTC 
TMKMSVR3CAMLRRSP3V: 

GATGAGTCTtTTACCTCSTCGACXTrCCTC^^ 
MSVYVV2LLR3??* v ' rs ' r " : ' ? 9 KNaL?PYRKSVWSKLQSia 

AATCAGACAGCAC"TGAAGAGGGTGCAGC7GC0GG^ 
IRQHLKRVQLR3L33A3VaoaaBARPALLTSRLR?IPKPO 

CGGGCTtXTCGCCGATTCrrGAACATGGACTACGTC3TGGG^ 
GLRPIVMMDYVVGARTPRR3KRA3RLTSRVKALFSVLMYE 



GCGGGCGCGGCGCCCCGGCCrCCTGGGCGCC^ 
RARRP3LLGASVLGL03 * 3RAWRTPV 



CCCAGGACCCGCCGCCTGAGCTGTACTT 
AQDPPPSLYP 



GACAGGCTCACCGAGCrrCATCGCCAGCATCATCAAACCCCAGAACACGTACTGCGTGC 

drlt3v:asi ikpqmtycvrryavvq 



TGTCAAG 
V K 

GAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGCCAC3 
KAAKGHVRXAPKSH 

TGCCGTCCTTCATCC^GCAGAGCTCCTCCCTGAATGAGGCCAGCAGTGGC 
AVVIBQSSSLMBASSGL?3V?iRPMCHHAVRIRGKSYVQC 

CCAGGGGATCCCGCAGGGcit^TCCrrCTCeACGC^^ 1 ^^vJGA 

QGIPQGS I LSTLLCSLCYGSMEMKLPAGrRRDGLLLRLVD 

D ? L L V T P^H LTHAKTPLRTLVRGVPEYGCVVMLRKTVVNPP 

rriibi : c agatgccggcccacggcctattcccctggtgcggcl'i'oc'1'(j<- : cgatac ccgcac cctggaggtgcagagcgactactccag 

A LGGTAPVQM PAHGL7PWCGLLL0TRTLEVQS DY3R 



V 3 



GTGAGCGCACCTGGCCGGAAGTGGAGCCTTjnjCCCGG 



TGCCACAGGGTGCCCCTCGTXrCCATCTGGGGCTGAGCACAAATGCAT 



TGGGAGTGAGGGTGCCTCACAACGGGAGCAGTTTTCTGTGCTATTTTGGT. 



FIG. 11 J 



motif A and altered C-t^BFinus 



ATI 
M 



CCGCTOCCSAGCXXrrtXBCTCCCTGCTGCGCAGC^ 
PRCRAVRSLLRSHTREVLPLATFV 



CGGCGCCTGGGGCCCCAGGGCTXXXGG C n\ ^ n X 3lGC^^ H.U^CGCGClUi'l'OGCC 
RaLGPQGWRI.VQaaOPAA?2Al.VAQCLVCVPW 



P P A A 



ACGTGCTGGCCTTCGGCTTCGCGCTGCTGGACGGGGCCCG 
VLQaLCBRGAKHVLAPGPALLDGAR 

CGGGGGCCCCCCCGAGGCCTTCACCACCAGCGTGCGCAGCT 
GGPPSAPTTSVRSYLPMTVTDALRGSGAWGLLLRRVGDDV 

eCGCCGCTGTACCAGCTCGGCGCTGCCACTCAGGTC 
LVAPSCATQVCGPPUYQLGAATQARPPP 

ACACGCTAGTGGACCCC 
H A S G P a 

TTGGGCAGGGGTCCTOGGCCCACCCGGGCAGGACGCGTGGACCGAGTGACCG 
RTPVGQGSWAHPGRTRGPSDR 

TGGTTTCTtTrTTTGGTGTCACCTGCCAGACC^ 
GPCVVSPARPASEATSLSGALSGTRH5HP5VGRQHHAGPP 

ATCCACATCGCGGCCACCACGTCCCTCX^CA^ 
STSR p P RPSIDTPCPPVYAE?KHPI,YSSGDKEQI.RPSPLLS 

CTCTCTGAGGCCCAGCCTGACrGGCGCTCGGAGGCTCGTGGA 
Slt RPSLTGARRLVETIPLG3R?WMPGTPRRLPRLPQRYWQ 



AATGCGGCCCCTGTTTCTG 

ELLGNHAQCPYG 

GGAGAAGCCCCAGGGCTCT^rTGGCGGCCCCCGAGGAGGAGGACACAG^ 
BKPQGS*VAAPEBSDTD?aRLVQLLRQHSS?HQVYGPVaAC 

CCTGCGCCGGCTGGTGCCC^CAGGCCTCTGGGGCTCCAGGCACAACGAACGCCGC^ 
L*RRl/vP?GLWGSRHM2fta?:.a>ITKKF I SLGKHAKLSLQEL 



GACGTGGAAGATGAGCCTGCGGGACTGCGCTTGGCTGCGCAGGAGCCC 
THKMSVaaCAMLRRS? 



CGGTTGG v. , . - - J ;ui C CGGCCGCAGAGCACCGTCTGCGTGAGGAGATCCTGGCCAAGTTCCTGCACTGGCT 
1YG = 7?AASHRLRBS i LAKPLSWL 



OAraGTGTGTACGTCGTCGACXTrGCTCAC^ 
HSVYVVELLRSPPYVTSTTP3KMRLPPYRICSVWSKLQSIG 

AATCAGACAGCAC'TGAAC^GGGTGCAGCTGCGGGAGCTGTCGG^ 
IRQHLKRVQLREt.SEA2VR3HReARPALLTSa-LaPIPKPD 

QL*Rp 1_ I*VMMDYVVGART7Ra3KRASRLTSRVKALPSVLMYE 

GCCX^GCGGCGCCCCGGCCTCCTGGGCC^CTCTGTGCTGG^ 
RAR R PGL*Ij*GA S V I* G I* D □ I H RAWRTPVLRVRAQ D P P P 2 L Y P 

GACAGGCTCACGGAGGTCATCGCCAGCATCATGAAACCCCAGAACACGTACTCC 

DRLTSVIASI I KPQNTYCVRRYAVVQ 



TGTCAAG 
V K 



GAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGC CACGTCTCTACCTTGACAGAC CTC CAGCCGTACATGCGACAGTTCGTGGCTCACCTGCAGGAGACCAGCCCGCTGAGGGA 
KAAHGHVRKAPKSHVSTLTDLQPYMRQPVAHLQETSPLRD 

TGCCGTCGTCATCGAGCAGAGCTCCTCCCTGAATGAGGCCAGCAGTGGCw i i_ i . CGACGT 
A V V I BQS3SLNEASSGLPDV 



CCTACGCTTCATGTGCCACCACGCCGTGCGCATCAGGGGCAAGTCCTACGTCCAGTG 
LRPMCH-KAVR IRGKSYVQC 



CCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTGCTCT 
QGIPQGSILSTLLCSLCYGDM3MKLPAGIRRDGLLLRLV0 

TGATTTCTTGTrGCTGACACCTC^CCTCAC^ 
DPLLVTPHLTHAKTPLRTLVRGyPEYGCVVNLRKTVVNPP 



TGTAGAAGACGAGGCCCTGGGTGGCAC 
VSDEALGGT 



ATGCCGGCCCACGGCL : A JXCCCTGGXGCOGCCircTOCTOGATACCCSGACCCT^ 
PVQMPAHGLPPWCGLLUDTRTLSVQSDY3S 



CTATGCCCGGACCTCCATCAGAGCCAGTCTCACCTTC^ 
YARTSrRASLTPNRGPKAGRNMRRKLFGVLRLKCHSLPLD 

TTTGCAGGTGAACAGCCTCC^GACGGTGTG^ 
LQVMSLQTVCTHIYKILLLQAYRPHACVLQLPPHQQVMKW 

CCCCACATTTTTCCTGCGCGTCATCTrrGAC^ 
PTPP*LRV I S OTASLCYS I LKAKNAE 

i 

CCGAAGAAAACATTTCTGTCGTGACTCCTGCGGTGCTTGGGTC 
EEil I LVVTPAVLGS 

GGGACAGCCAGAGATGGAGCCACCCCGCAGACCGTCGGGTGTGGGCAGCTTTC CGGTGTCTC CTGGGAGGGGAGTTGGGCTGGGCCTGTGAC 
GQPEMBPPRRPSGVGSPPVSPGRGVGLGL- 



FIG. UK 



a 



N-t 



nal truncated telomeras 



er. 2) 




RRLGPQGWRLVQRGDPAAFRALVAQCLVCVPWDARPPPAA 



ATGCGGAGAGCAGCGCAGGCGACTCAGGGCGCTTCCCCCGCAGGTG 
GLPGVGVRLGLRAAGGNQRHABSSAGDSGRPPRR 
ASPGSASGWG*GRPGGTSDNRRAAQATQGASPAG 
PPRGRRPAGVSGGRGBPATCGEQRRRLRALPPQV 



PSPRQVSCLKSLVARVLQRI.CERGAKNVLAFG 



A L L D G A R 



CGGGGGCCCCCCCGAGGCCTTCACCACCAGCGTGCGCAGCTACCTGCCCAACAC^ 
GGPPBAPTTSVRSYLPMTVTDALRGSGAWGLLI.RRVGDDV 




CAGCCGAJUTTCTGCCGTTGCCCAAGAGGCCCAGGC^^ 
SRSLPLPKRPRRGAAPSPBRTPVGQGSWAHPGRTRGPSDR 



CCTGCCACACCCGCCGAAGAAGCCAC lll 11 ll.U l GC GTt X 3SCrCTC ra GCACGCGCCAC^ 
GFCVVSPARPAEBATSL3GALSGTRHSHPSVGRQHHAGPP 



ATCCACATCCiCGGCCACCACGTCCCTGGGACACGCCrrm^ 
STSRPPRPWDTPCPPVYA3TKHPLYSSGDKEQLRPSPLLS 



if »% 



CTCTCTGAGGCCCAGCCTGACrGGCGCTCGGAGGCTCGTGGAGACCAT L r ■ ■ ll L\*U, l ' IT. ' J AGGCCCTGGATGCCAGGGACTCCCCGCAGGTTGCCCCGCCTGCCCCAGCGCTACTGGCA 
SLRPSLTGARRLV3TIFI.GSRPWMPGTPRRLPRI.PQRYWQ 



AATGCGGCCCCTGTTTC 
M R ? L P 



LGMHAQCPYGVS. 



I'll 



GGAGAAGCCCCAC 
E K P Q G 5 



CCCCCGAGGAGGAGGACACAGACCCCCCTCCKXrrGGTGCAG^ 
VAAPES30TDP3RLVQLLRQHSSPWQVYGFVRAC 



CCTGCGCCGGCrGGTGCCCCCAGGCCTCTGGGGCTCCAGGCACAACGAACGC'w'^O 1 . V_ .l-AGGAACACCAAGAAGTTCATCTCCCTGGGGAAGCATGCCAAGCTCTCGCTGCAGGAGCT 
LRRLVPPGLWGSRHSSRRPLRMTlCKPrSLGKHAKLSLQSL 



GACGTGGAAGATGAGCGTGCGGGACTGCGCTTGGCTGCGCAGGAGCCCAGGGGT^ 
TMKM5VR3CAMLRR3PGV3CVPAAEHRLREE I LAXFLHWL 



s : .=:f 



GATGAGTGTGTACGTCGTCGACCTGCTCAGGTL"rr:i_: i 1 i ATGTCACGGAGACZAL ^ i i 1 VAAAAGAACAGGCTC i'lU'rrCTACCGGAAGAGTGTCTGGAGCAAGTTGCAAAGCATTGG 
MSVYVYELLRSFPYVT3T77QKMRLPPYR1CSVWSKLQSXG 

AAT- - NNN - - GACAGTCACCAGGGGGGTTGACCGCCGGACTGGGCGTCCCCAGGGTTGACTATAGGAC 

CATGGGTGGACGTGGCCCCGGGCATGGC L - r iL'l U CU 11 1U1 rGCCGTGGCrrCCCCTGAGCCCTCACTGAGTCGGTGGGGG 

GCTGAGCAAGCCTCCTGAGGGGCTCTCTATTG- 



^Truncated protein 1 (ver 



CCTGCTGCGCAGCCACTACCGCGAGGTGCTGCCGCTGGCCA^ 
RCRAVRSLLRSHTRBVX,PLATPV 



CGGCGCCTGGGGCCC 
RRLGPQGWR 



LVQRGDPAA 



CCCftCTGCCTt^roT G CGTGCCCTG<^CGCACGGCCGCCCCCaX:^ 
RALVAQCLVCVPWDARPPPAA 



GGCCTCC 

GLPGVGVRLGLRAAGGNQRHAESSAGDSGRPPRR 
ASPGSASGWG*GR?GGTSDMRRAAQATQGASPAG 
PPRGRRPAGVBGGRGEPATCGBQRRRLRALPPQV 

CCAGtflVrCCT G CCTGAAGGAGCTGGTGGCCCG 
PSPRQVSCLKBI»VARVI#QRI»CBRGAKMVLAPGPALLDGAR 



GGPPBAFTTSVRSYI*PNTVTDALRGSGAWGLLLRRVGDDV 




TGU Tl 'l' t. 'l tj 'l t» 'll A» 'l l» 1 CACCTGCCAGACCCGCI 
GPCVV5 PAR PAS 



ATCCACATCGCGGCCACCACGTCCCTtX^CACGCCTTXTTCCCCC 
STSRPPRPW0TPCPPVYA3TKHPLYSSGDKBQLRPSPLLS 

CTCTCTGAGGCCCAGCCTGACTGGCGCTCGGAGGCTCGTGGAGACCAT C ' 1 ' 1 " ^ 
SLRPSLTGARRLVETIPLaSRPHMPGTPRRLPRLPQRYWQ 



AATGCGGCCCCTG 
M R P L P L 



ACCACCCGCACrnKCCCTACGGGGTGCTCCTCAAGACGCACrGCCCGC^ 
LL.G.SHAQCPYGVwLKTHCPI.RAAVTPAAGVCAR 



GGAGAAGCCCCAGGGCTCTGTtXXTGGCCCCCCAGGAGGAGGACACAG^ 
BKPQGSVAAP33SDTDPRRLVQLLRQHSSPMQVYGPVRAC 



CCTGCGCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCCAGGCACAACGAACGCCG 
L.RRLVPPGLMGSRHM3RR 



rTCTCAGGAACACCAAGAAGTTCATCTCCCTGGGGAAGCATGCCA^ 

^RNTXKPISLGKHAKLSLQEL 



GACGTGGAAGATGAGCGTGCGGGACTCCGCTTGGCTGCGCAGGAGCCCAGG 
TWKHSVRDCAWLRRSPGVGCVPAA5HRLRES I LAKPLHWL 

GATGAGTGTGTACGTCGTCaAGCTGCTCAGGTCTTTCTTTTATGT^ 
MSVYVVSLLRS??YVTSTT73KMRL?PYRiCSVWSlCLQSIG 

AATCAGACAGCACTTGAAGAGGGTGCAGCTGCGGGAGCTGTCGGAAGCAGAG 
IRQHLKRVQLRSLSEA2VRQ3REARPALLTSRLRPIPKPD 

GTGGCTGTGCTTTGGTTTAACTTCCTTTTTAACCAGAA 
VAVLWPTPLPMQK 



CGGGCTGCGGCCGATTGTGAACATOGACTACGTCGTGGC^GCCA^ 
GLRPIVMMDYVVGARTFRR3SCR PSVSPRG* 



FIG. 11M 



uncated protein 2 (ver, 



C L ' XXJClti CGCAGCCACrACCGCGAGGTGCTGCC^^ 
RAPRCRAVaSLLRSHTRBVL PLATPV 

CCCCCCGCCGC 
P P P A A 

ATGCGGAGAGCAGCGCAGGCGACnX^USGGCGCTTCCC^ 
GI.PGVGVRLGLRAAGGHQRHABSSAGOSGRPPHR 
ASPGSASGWG*GaPGGTSDMRRAAQATQGASPAG 
PPRGRRPAGV3GGRGSPATCGEQRRRLRALPPQV 

CCCCTCCTTCCGCCAGGTCTTCCTGCCTGAAGGAGC^ 
PSPaQVSCLK2LVAaVLQai,CSRGAKHVLAPGPALLDGAR 

CGGGGGCCCCCCCGAGGCCrTaiCCACCAGCXrrGCGCAGCTACCTGCCCA^ 
GGPPSAFTTSVRSYLPWTV7DALRGSGAWGLI.LRRVGDDV 



ACACGCTAGTGGACCCCGAAGGCGTCITXX^TC^GAACGGGCCT^ 
HASGPRaaLGCSRAWM3SVa3AGVPLGLPAPGARRRGGSA 

CAGCCGAAGTCTGCCGTTGCCCAXGAGGCCCAGGCGTGGCG 
SRSLPL?KRPRaGAAP3P3aTPVGQGSWAHPGRTRGPS0R 

TG Gl^ 'l VIuivi^lVlTJ ^CTGCCAGACCCGCCGAAGAAGCCAC L it- 1 i *tj GAGGGT3CGCrCTCTGGCACGCGCCACTCCCACCCATCCGTGGGCCGCCAG 
GPCVVSPARPASBATSL33ALSGTRHSHPSVGRQHHAGPP 



CTCTXrrGAGGCCCAGCCTTlACTGGCGCTCGGAGGCTCGTGGAGACCA IV i. I .L. ' JU,: /, ' ^ GGCCCT^GATGCCAGGGACTCCCCGCACXriTGCCCCGCCT^ 
SLR?SLTGARRLV3Tr?i33RPWMPGT?RRL?RLPQRYWQ 

AATGCGGCCC L - lVryi ' ClT^ GAG Clt^^ 

MRPLPLSLLGMHAQCPYSVI.LXTHCPLRAAVTPAAGVCAR 

C^GJUVGCCCCAGGGCTCTGTGGCGGCCCCCGAGGAGGAG^ 
BKPQaSVAAPaaSDTDPaaiVQLLRQHSSPWQVYGPVRAG 

CCTCCCXrCGGCTCGTGCCCCIIAGGCCTCTGGGGOr^ 
LRRLVPPGLHGSRH!l3aa?-aMT!CICPrSI.GKHAKLSLQSL 



GACGTGGAAGATGAGCGTCCGGGACTGCGCTTGGCTtXTGCAGGAGCCCAGGGGT^ 
TMKMSVRDCAWLRRS?3'/3 



CCGGCCGCAGAGCACCCTTCTrtJCGTGAGGAGATCCITCXjCCAAGTTCCTGCACTGGCT 
CVPAAEHRI.a3SILAKPLHWL 



GATGAGTGTrTrACCTCGTCGAGCTGCrCAGGTCTTTCTTTTAT^ 
MSVYVV3LLRSPPYVT3TTPQKSRLPPYRKSVWSKLQSIG 

AATCAGACACCACTTGAAGAGGGTTX^GCTGCGGGACKTrcrrCGGAA 
IRQHLKRVQLRELSEA2VR3HR2ARPALLTSRLRFIPKPD 



CGGGCTGCGGCCC^TTGTGAACATGGACTACGTCGTGGGAGCCAGAACG 
G L R P rvUMDYVVGARTPaaSjCRA 



CCTCGAGGGTGAAGGCACTGTTCAGCGTGCTCAACTACaA 
TSRVKALF3VLMYS 



GCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTCTGTGCTGGG^ 
RARRPGLLGASVLGLODiaaAaaTPVLRVaAQDPPPBLYP 

TGTCAAGGTGC^TTTrGACGGGCGCGTACGACACCATCCCCCAGGACAGG^ 
VKVOVTGAYOT I PQDRLT3VIAS I IKPQMTYCVRRYAVVQ 

GAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGCCAC 
KAAHGHVRKAPKSH 

GTCCTACGTCCAGTG 
V L R P V 

CCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTGCTCTtX^VGC Lr 

PGD?AGLfiPLHAALQPVLaa3GSQAVCGD3AGRAAPA?VG 



TGATTTCTTTTrTGGTGAGACCTCACCTCACCCACGCGAA 



FIG. UN 



^J^eference protein (ver, 



ATGCCGCGCGCTCCCCGCTGCCGAGCCGTGCGCTCCCTGCTGCGCAGCCACTACCGCGAG 60 
MetProArgAlaProArgCysArgAlaValArgSerLeuLeuArgSerHisTyrArgGlu 20 

GTGCTGCCGCTGGCCACGTTCGTGCGGCGCCTGGGGCCCCAGGGCTGGCGGCTGGTGCAG 120 
ValLeuProLeuAlaThrPheValArgArgLeuGlyProGlnGlyTrpArgLeuValGln 40 

CGCGGGGACCCGGCGGCTTTCCGCGCGCTGGTGGCCCAGTGCCTGGTGTGCGTGCCCTGG 180 
ArgGlyAspProAlaAlaPheArgAlaLeuValAlaGlnCysLeuValCysValProTrp 60 

GACGCACGGCCGCCCCCCGCCGCCCCCTCCTTCCGCCAGGTG 
AspAlaArgProProProAlaAlaProSerPheArgGlnVal 

GGCCTCCCCGGGGTCGGCGTCCGGCTGGGGTTGAGCX3CGGCCGGGGG 

GLPGVGVRLGLRAAGGNQRHAESSAGDSGRFPRR 
ASPGSASGWG*GRPGGTSDMRRAAQATQGASPAG 
PPRGRRPAGVEGGRGEPATCGEQRRRLRALPPQV 

TCCTGCCTGAAGGAGCTG 240 
SerCysLeuLysGluLeu 8 0 

GTGGCCCGAGTGCTGCAGAGGCTGTGCGAGCGCGGCGCGAAGAACGTGCTGGCCTTCGGC 3 00 

ValAlaArgValLeuGlnArgLeuCysGluArgGlyAlaLysAsnValLeuAlaPheGly 100 

TTCGCGCTGCTGGACGGGGCCCGCGGGCX3CCCCCCCGAGGCCTTCACCACCAGCGTGCGC 3 60 

PheAlaLeuLeuAspGlyAlaArgGlyGlyProProGluAlaPheThrThrSerValArg 120 

AGCTACCTGCCCAACACGGTGACCGACGCACTGCGGGGGAGCGGGGCGTGGGGGCTGCTG 420 

SerTyrLeuProAsnThrValThrAspAlaLeuArgGlySerGlyAlaTrpGlyLeuLeu 140 

TTGCGCCGCGTGGGCGACGACGTGCTGGTTCACCTGCTGGCACGCTGCGCGCTCTTTGTG 4 80 

LeuArgArgValGlyAspAspValLeuValHisLeuLeuAlaArgCysAlaLeuPheVal 160 

CTGGTGGCTCCCAGCTGCGCCTACCAGGTGTGCGGGCCGCCGCTGTACCAGCTCGGCGCT 54 0 

LeuValAlaProSerCysAlaTyrGlnValCysGlyProProLeuTyrGlnLeuGlyAla 180 

G C C ACT C AGG C C C GG C C C C C G C C ACAC GCT AGTGG AC C C C GAAGGC GT C TGGGATGCG AA 600 

AlaThrGlnAlaArgProProProHisAlaSerGlyPrcArgArgArgLeuGlyCysGlu 200 

CGGGCCTGGAACCATAGCGTCAGGGAGGCCGGGGTCCCCCTGGGCCTGCCAGCCCCGGGT 660 

ArgAlaTrpAsnHisSerValArgGluAlaGlyValProLeuGlyLeuProAlaProGly 220 

GCGAGGAGGCGCGGGGGCAGTGCCAGCCGAAGTCTGCCGTTGCCCAAGAGGCCCAGGCGT 72 0 

AlaArgArgArgGlyGlySerAlaSerArgSerLeuProLeuProLysArgProArgArg 240 

GGCGCTGCCCCTGAGCCGGAGCGGACGCCCGTTGGGCAGGGGTCCT GGGCCCACCCGGGC 780 
GlyAlaAlaProGluProGluArgThrProValGlyGlnGlySerTrpAlaHisProGly 260 

AGGACGCGTGGACCGAGTGACCGTGGTTTCTGTGTGGTGTCACCTGCCAGACCCGCCGAA 840 
ArgThrArgGlyProSerAspArgGlyPheCysValValSerProAlaArgProAlaGlu 280 

GAAGCCACCTCTTTGGAGGGTGCGCTCTCTGGCACGCGCCACTCCCACCCATCCGTGGGC 900 
- GluAlaThrSerLeuGluGlyAlaLeuSerGlyThrArgHisSerHisProSerValGly 300 

CGCCAGCACCACGCGGGCCCCCCATCCACATCGCGGCCACCACGTCCCTGGGACACGCCT 960 
ArgGlnHisHisAlaGlyProProSerThrSerArgProProArgProTrpAspThrPro 320 

TGTCCCCCGGTGTACGCCGAGACCAAGCACTTCCTCTACTCCTCAGGCGACAAGGAGGAG 1020 
CysProProValTyrAlaGluThrLysHisPheLeuTyrSerSerGlyAspLysGluGln 340 

CTGCGGCCCTCCTTCCTACTCAGCTCTCTGAGGCCCAGCCTGACTGGCGCTCGGAGGCTC 10 80 
LeuArgProSerPheLeuLeuSerSerLeuArgProSerLeuThrGlyAlaArgArgLeu 360 

GTGGAGACCATCTTTCTGGGTTCCAGGCCCTGGATGCCAGGGACTCCCCGCAGGTTGCCC 1140 
ValGluThrllePheLeuGlySerArgProTrpMetProGlyThrProArgArgLeuPro 3 80 

CGCCTGCCCCAGCGCTACTGGCAAATGCGGCCCCTGTTTCTGGAGCTGCTTGGGAACCAC 12 00 

FIG. HO 



ArgLeuProGlnArgTyrTrpGlnMe' 




IroLeuPheLeuGluLeuLeuGlyAsnH: 



:is 




GCGCAGTGCCCCTACGGGGTGCTCCTCAAGACGCACTGCCCGCTGCGAGCTGCGGTCACC 
AlaGlnCysProTyrGlyValLeuLeuLysThrHisCysProLeuArgAlaAlaValThr 

CCAGCAGCCGGTGTCTGTGCCCGGGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCGAGGAG 
ProAlaAlaGlyValCysAlaArgGluLysProGlnGlySerValAlaAlaProGluGlu 

GAGGACACAGACCCCCGTCGCCTGGTGCAGCTGCTCCGCCAGCACAGCAGCCCCTGGCAG 
GliiAspThrAspProArgArgLeuValGlnLeuLeuArgGlnHisSerSerProTrpGln 

GTGTACGGCTTCGTGCGGGCCTGCCTGCGCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCC 
ValTyrGlyPheValArgAlaCysLeuArgArgLeuValProProGlyLeuTrpGlySer 

AGGCACAACGAACGCCGCTTCCTCAGGAAC^CCAAGAAGTTCATCTCCCTGGGGAAGC^T 
ArgHisAsnGluArgArgPheLeuArgAsnThrLysLysPhelleSerLeuGlyLysHis 

GCCAAGCTCTCGCTGCAGGAGCTGACGTGGAAGATGAGCGTGCGGGGCTGCGCTTGGCTG 
AlaLysLeuSerLeuGlnGluLeuThrTrpLysMetSerValArgAspCysAlaTrpLeu 

CGCAGGAGCCCAGGGGTTGGCTGTGTTCCGGCCGCAGAGCACCGTCTGCGTGAGGAGATC 
ArgArgSerProGlyValGlyCysValProAlaAlaGluHisArgLeuArgGluGluIle 

GTGGCCAAGTTCCTGCACTGGCTGATGAGTGTGTACGTCGTCGAGCTGCTCAGGTCTTTC 
LeuAlaLysPheLeuHisTrpLeuMetSerValTyrValValGluLeuLeiiArgSerPhe 

TTTTATGTC ACGGAGAC CACGTTTCAAAAGAACAGGCTL- TTTT CTACC GG AAGAGTGTC 
PheTyrValThrGluThrThrPheGlnLysAsnArgLeu?he?heTyrArgLysSerVal 

TGGAGCAAGTTGCAAAGCATTGGAATCAGACAGCACTTGAAGAGGGTGCAGCTGCGGGAG 
TrpSerLysLeuGlnSerlleGlylleArgGlnHisLeuLysArgValGlnLeuArgGlu 

CTGTCGGAAGCAGAGGTCAGGCAGCATCGGGAAGCCAGGCCCGCCCTGCTGACGTCCAGA 
LeuSerGluAlaGluValArgGlnHisArgGluAlaArgProAlaLeuLeuThrSerArg 

CTCCGCTTCATCCCCAAGCCTGACGGGCTGCGGCCGATTGTGAACATGGACTACGTCGTG 
LeuArgPhelleProLysProAspGlyLeuArgProIleValAsnMetAspTyrValVal 

GGAGCCAGAACGTTCCGCAGAGAAAAGAGGGCCGAGCGTCTCACCTCGAGGGTGAAGGCA 
GlyAlaArgThrPheArgArgGluLysArgAlaGluArgLeuThrSerArgValLysAla 

CTGTTCAGCGTGCTCAACTACGAGCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTCTGTG 
LeuPheSerValLeuAsnTyrGluArgAlaArgArgPrcGIyLeuLeuGlyAlaSerVal 

CTGGGCCTGGACGATATCCACAGGGCCTGGCGCACCTTCGTGCTGCGTGTGCGGGCCCAG 
LeuGlyLeuAspAspIleHisArgAlaTrpArgThrPheVall.euArgValArgAlaGln 

GACCCGCCGCCTGAGCTGTACTTTGTCAAGGTGGATGTGACGGGCGCGTACGACACCATC 
AspProProProGluLeuTyrPheValLysValAspValThrGlyAlaTyrAspThrlle 

CCCCAGGACAGGCTCACGGAGGTCATCGCCAGCATCATCAAACCCCAGAACACGTACTGC 
ProGlnAspArgLeuThrGluVallleAlaSerllelleLysProGInAsnThrTyrCys 

GTGCGTCGGTATGCCGTGGTCCAGAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAG 
ValArgArgTyrAlaValValGlnLysAlaAlaHisGlyHisValArgLysAlaPheLys 

AGCCACGTCTCTACCTTGACAGACCTCCAGCCGTACATGCGACAGTTCGTGGCTCACCTG 
SerHisValSerThrLeuThrAspLeuGlnProTyrMetArgGlnPheValAlaHisLeu 

CAGGAGACCAGCCCGCTGAGGGATGCCGTCGTCATCGAGCAGAGCTCCTCCCTGAATGAG 
GlnGluThrSerProLeuArgAspAlaValVallleGluGlnSerSerSerLeuAsnGlu 

GCCAGCAGTGGCCTCTTCGACGTCTTCCTACGCTTCATGTGCCACCACGCCGTGCGCATC 
AlaSerSerGlyLeuPheAspValPheLeuArgPheMecCysHisHisAlaValArglle 

AGGGGCAAGTCCTACGTCCAGTGCCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTG 
ArgGlyLysSerTyrValGlnCysGlnGlylleProGlnGlySerlleLeuSerThrLeu 

CTCTGCAGCCTGTGCTACGGCGACATGGAGAACAAGCTGTTTGCGGGGATTCGGCGGGAC 
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FIG. IIP 



LeuCysSerLeuCysTyrGlyAspMec^^nLysLeuPheAlaGlYlleArgArgAsp 

GGGCTGCTCCTGCGTTTGGTGGATGATTTCTTGTTGGTGACACCTCACCTCACCCACGCG 2640 
GlyLeuLeuLeuArgLeuValAspAspPheLeuLeuValThrProHisLeuThrH^Ala 880 

AAAACCTTCCTCAGGACCCTGGTCCGAGGTGTCCCTGAGTATGGCTGCGTGGTGAACTTG 
LysThrPheLeuArgThrLeuValArgGlyValProGluTyrGlyCysValValAsnLeu 

CGGAAGACAGTGGTGAACTTCCCTGTAGAAGACGAGGCCCTGGGTGGCACGGCTTTTGTT 
ArgLysThrValValAsnPheProValGluAspGluAlaLeuGlyGlyThrAlaPheVal 

CAGATGCCGGCCCACGGCCTATTCCCCTGGTGCGGCCTGCTGCTGGATACCCGGACCCTG 
GlnMetProAlaHisGlyLeuPheProTrpCysGlyLeuLeuLeuAspThrArgThrLeu 

GAGGTGCAGAGCGACTACTCCAGCTATGCCCGGACCTCCATCAGAGCCAGTCTCACCTTC 
GluValGlnSerAspTyrSerSerTyrAlaArgThrSerlleArgAlaSerLeuThrPhe 

AACCGCGGCTTCAAGGCTGGGAGGAACATGCGTCGCAAACTCTTTGGGGTCTTGCGGCTG 2940 
AsnArgGlyPheLysAlaGlyArgAsnMetArgArgLysLeuPheGlyValLeuArgLeu 980 

AAGTGTCACAGCCTGTTTCTGGATTTGCAGGTGAACAGCCTCCAGACGGTGTGCACCAAC 
LysCysHisSerLeuPheLeuAspLeuGlnValAsnSerLeuGlnThrValCysThrAsn 

ATCTACAAGATCCTCCTGCTGCAGGCGTACAGGTTTCACGCATGTGTGCTGCAGCTCCCA 
IleTyrLysIleLeuLeuLeuGlnAlaTyrArgPheHisAlaCysValLeuGlnLeuPro 
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TTTCATCAGCAAGTTTGGAAGAACCCCACATTTTTCCTGCGCGTCATCTCTGACACGGCC 
PheHisGlnGlnValTrpLysAsnProThrPhePheLeuArgVallleSerAspThrAls 

TCCCTCTGCTACTCCATCCTGAAAGCCAAGAACGCAGGGATGTCGCTGGGGGCCAAGGGC 3180 
SerLeuCysTyrSerlleLeuLysAlaLysAsnAlaGlyMecSerLeuGlyAlaLysGly 1060 

GCCGCCGGCCCTCTGCCCTCCGAGGCCGTGCAGTGGCTGTGCCACCAAGCATTCCTGCTC 
AlaAlaGlyProLeuProSerGluAlaValGlnTrpLeuCysHisGlnAlaPheLeuLeu 

AAGCTGACTCGACACCGTGTCACCTACGTGCCACTCCTGGGG7CACTCAGGACAGCCCAG 
LysLeuThrArgH^sArgValThrTyrValProLeuLeuGlySerLeuArgThrAlaGln 

ACGCAGCTGAGTCGGAAGCTCCCGGGGACGACGCTGACTGCCCTGGAGGCCGCAGCCAAC 3360 
ThrGlnLeuSerArgLysLeuProGlyThrThrLeuThrAlaLeuGluAlaAlaAlaAsn 1120 

CCGGCACTGCCCTCAGACTTCAAGACCATCCTGGAC 
ProAlaLeuProSerAspPheLysThrlleLeuAsp 
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# 



runcated protein 3 (ver, 



ATC ^CCCGCCX7rCCCCGC^^ 

MPaAPaCaAVRSLLRSHTRBVLPLATFV 

^T(^QG;^GAGCAGCGCAGGCGACTCAGGGCGCTTCCCCCGCAGGTG 

a L p a v a v a ~l g t. a a a e a s Q R h a e s s a g d s g r p p R a 

aLLI^^ 



RSLPLPKaPaa GAAt ' s ^ i ,t - rv " w ""* 

GPCVV3PAa?A33ATSI.3^A-i^iKna™ 

ATCCACATMCCXKCACCAC^^ 

STSaPPRP**D T?C?!? 

A^TGCGCCCC™^ 

NR PLPLS^L3»HAQC?/ J '--KTHCP-RAA 



GGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCjAGGAGGAGGACACAGACCCC^ » .^-c- - 
EKPQGSVAA?2223T3?i^-* 



GTGCAGCTGCTCCGCCAGCACAGCAGCCCCTGGCAGGTGTAC 

7 Q L L a Q H 5 S P W Q 7 Y G ? V R A C 



C^TTGTTCCGCKCG^GAGCACCGTCra 
C7PAA2HRLRES ILAXFLHWL 



GACGTGGAAGATGAGCGTGCOGGACTGCGCTTGGCTTX^ - - 

TWKMSVRDCAWLRR3PG' 



GATCACT^AC^ccTCSAGcrccrc^^ 

MSVYVV2L.LR3 E ' ?Y/ '*'* - 
IRQHLKRVQI*aEi*5-Ai a j - . 

cxrccccoccccoccccc^crc^^ 

RARRPGLLGASVLGL33-3R**«irr 

VKVDV7GAYDTI ? Q 3 R «* - S / i A a 
CAAC^CCCCCATCCGCAC^CC^^ 

kaahghvbkapksh/st-.3-a 
^ccctc^tccaoca^^ 

AVVIEQSSSLMSASaGL?3/--Krn^" n « 

cca^tcccccaoccct^^ 

QGIPQGSIl-S Tl * LUil ' u 

TGATrrcrr.nTCCTCA^^ 

D?LLVTPHLTHAK a 

VBDBALGOTA?VQM?AH^-F?WCOLLLOTRTi.»^ 
GTCACCCCACCiraCG^GTSG*^ 



A^^red C- terminus protein 



2) 



ATGCCGcexxxrrccccGcitxrctau ^ 

HPRAPRCRAVRSLLRSHTRBVLPLATPV 
CGGCGCCTGGGGCCCCAGGGCIGGCGGCTGGTG^ ItXlX GCGCIXXrrGGCCCAGTGCCTGGTCTGCGTGCCCTGGGACG 

RRI*GPQG*4RLVQRGDPAA?RALVAQCLVCVPWDARPPPAA 
gtXXTCCCCGGGGTOXXXTrCCGGCTGGGGTTG^ 

glpgvgvrlglraaggnqrhaessagdsgrpprr 
aspgsasgwg*grpggtsdmrraaqatqgaspag 
pprgrrpagvsggrgbpatcgeqrrrlralppqv 

CCCCTCCTTCCGCCAGGTGTCCTGCCTGAAGGAGCTGGTGGCC^ 
PSPRQVSCLKSLVARVLQaLCERGAKHVLAPGPALLDGAR 

CGGGGGCCCCCCCGAGGCCTTCACCACCAGCGTGCGCAGCTACCTGCCC^ 
GGPPSAPTTSVRSYLPSTVTDALRGSGAWGLLLRRVGDDV 

GCTCGTTCACCTGCTGGCA 
I.VHLLARCAL 




ACCTXKOUIACCCGCCSAAGAAGCCACCTCrTTGGAGGGTG^ 
GPCVVSPARPAB2ATSL3GALSGTRHSHPSVGRQHHAGPP 

ATCCACATCGCGGCCACCACGTCCCTGC^CAC^CTrGTCC^^ 
STSRPPRPWDTPCPPVYA3TKHPLYSSGDKEQLRPSPLLS 

CTCTCTGAGGCCCAGCCTGACTGGCGCTCGGAGGCT^ 
SL*RPSL*TGARRLVSTIPLG3R?MMPGTPRRLPR1*PQRYMQ 

CCTCAAGACGCACTGCCCGCTGCGACXTTGCGGTCACCCCAGCAGCC 
LJCTHCPLRAAVTPAAGVCAR 



AATGCGGCCCCT tj rri ' L ' iXj GAGCrGCrTGGGAACCACGCGCAGTGCCCCTACGGGGTGCr 
MRPLPLSLLGMHAQCPYGVL 



GGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCjAGGAGGAGGACACAGACCCCCGTCGCCTC 
EKPQGSVAAP3S20T3PRR1VQL 



CCnWZGCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCCAG 
LRRLVPPGLWGSRHM3RR 



CCTCAGGAACACCAAGAAGTTCATCTCCCTGGGGAAGCATGCCAAGCrCTCGCTGCAGGAG 
LRNTKKP ISLGKHAXLSLQSL 



GACGTGGAAGATC^GCGTGCGGGACTGCGCTTGGCT^ 
TMKMSVR.OCAMLRRSPGVGrVPAASHRLREE I LAXFLHWL 



GATGAGTCTGTACGTCGTCCLAGCTGCTCAGGTL * 1 . It-, i. I 1ATGTCACGGAGACCACGTTTCAAAAGAACAG 
MSVYVVSLLRS??YV?2T7?3KMRLP 



TACCGGAAGAGTGTCTGGAGCAAGTTGCAAAGCATTGG 
YRXSVWSKLQS IG 



AATCAGACAGCAC-TTGAAGAGGGTGCAGCTGCGGGACXrm 
IRQHLKRVQLRSLSEA3VR3HR3ARPALL.TSRLRPIPKP0 

CGGGCTrcGGCCGATTGTGAACATCGACTACGTCCTGGGAG^ 
GL*RP i*vSMDYVVGART?RR3KRASRI*TSRVKALPSVLNYS 

GCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTL'IXJi'GCrGGGCCTGGACGATATC 
R A R R p^G L *LGASVLGL30IHRAWRTPVLRVRAQ0PPPSLYP 

TGTCAAGGTGGATGTGACGGGCGCGTACGACACCATCCCCCAGGACAGGCTCACG^ 
VKVDVTGAYDTI PQ3RLTEVIAS I I KPQNTYCVRRYAVVQ 

GAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGCCACGTCTCTACCr^ 
KAAHGHVRKAFKSHVSTLTDLQ.PYMRQPVAHLQETSPLRD 

TGCCGTCGTCATCGAGCACAGCTCCrrCCCTGAATGAGGCCAGC^^ 
AVVIS0S5SLNEASSGLPDVPLRPHCHHAVRIRGKSYVQC 

CCAGGGGATCCCGCAGGGCTCCATCCTCTCC^CGCTGCTCTGCAGCCTGTGC^ 
QGIPQGSILSTLI*CSLCYG3MEHKLPAGIRRDGLLLRLVD 

TGATTTCTTGTTGGTGACACCTCACCTCACCC^CGC 
DPLLVTPHLTHAKTPLRTLVRGVPBYGCVVMLRKTVVMPP 

TCTAGAAGACGAGGCCCTGGGTGGCACGG C ' - ' l ' l ' lUl 1 CAGATGCCGGCCCACGGCCTATTCCC CTGGTGCGGCCTGCTGCrGGATAC CCGGACCCTGGAGGTGCAGAGCGACTACTCCAG 
VBOBALGGTAPVQMPAHGLPPWCGLLLDTRTLEVQSDYSS 

CTATGCCCGGACCTCCATCAGAGCCAGTCTC^CCTrCAACCGCGGCTTCAAGGCT^ 
Y A R T S I RASLTPNRGPKAGRNMRRKLFGVLRLKCHSLFL.D 

TTTGCAGGTGAACAGCCTCCAC^CGGTGTGCACCAACATCTACAAGATC 
LQVNSLQTVCTNI Y K I LLLQAYRPHACVLQLPPHQQVWKM 

CCCCACATTTTTCCTGCGCGTCATCTCTGACACGGCCT 
PTPPLRV ISDTASLCYS I LKAKMAS 

I 

CCGAAGAAAACATTTCTGTCGTGACTCCTGCGGTGCTTGGGTC 
EENILVVTPAVLGS 



GGGACAGCCAGAGATGGAGCCACCCCGCAGACCGTCGGGTGTGGGCAGCTTTCCGGTG^ 
GQPSM3PPRRPSGVGSPPV3PGRGVGLGL* 



FIG. IIS 



?1 ^in that lacks motif A (v^ 2) 

SS^S °> ^ °* °> ^ s > *° > 

GGPPSA?TTSVR^ . ^_,l^ arr , r ^ CGGCGC rGCCACTCAGGCCCGGCCCCCGCC 

GCrGGTTCACCTGCIO^^ V C G P P L Y Q I. G A A T Q 

CICiraAGKCCACCC^CTCGC^^ „ , „ , 0 T P . « » 

SL aP3I.TO»aaJ- - :.,^~r^C^GCTCKGCTCACCCCACCAGCCGGTCTCTQTGCCCO 

l^jWWW^^ V T P A A 0 V C A « 

M^u-ccicK*^^ . 0 H S S P - Q v * c . V . A c 

GACGTCGAAGATGACCCTGCGCCACTGC jCTTCtA. » . ?a V 3--'PAAEHRl." 

GATCAGTGTGTACtJTCCTCSACCTGCTCAGCTl- yTST 7?5*« il '--" PYR 

AATCAGACAGCACTTGAA<^GGGTGCAGCTGCGGGAGCTCjTC»*«AAGk-AG#*Cur^ ^ g , , , „ » , A t L T 8 » t. » » 

1 R 9 " L K 1 V ' ^c^CACACAA^^ 
C«WW^T«GrGAA^ 

„ L . » t V H " □ * * . . oGc^CCrTC^Cr^TGCGGGCCCAGGACCC^CGCCT^CCrGTACrr 



TGTCAAG DS--- 2 

° G 1 p Q G s 1 L • ,_^i 0BMr ~^*«^^ 

^rrrcrrsrr^CACcrcAC^ 
d ? l t v t p a l t h a ^.^---OTtiwciee^ 

,™«^«^^ T 1 T L E / ° • 

CrATGCCCOGACCTCCATCAGAGCCAGTCTCACC^CC^-G^C^: a „ „ , , K L I 8 V L * t * C 

TTrCCAOrrSAACACKCrCCA^^ ^ ^ q ^ y R , „ , c v L Q , P Q 

' ' ^^^^p-^-^st-^CATCCT^AAAGCCAAGAACGCAGGGATCTCGCTGGGGviCCAAGG^^ A G P I. P S E 

a^TrrnoctoowiioTCtewA^ K A x , » 0 „ , l o a < a a a _ 

P T P P , R V I S 0 T A _ - jic ___^ c ^ oc ^^ 

WCOTaCAGTC =crcr=ccACCAA^ t 0 , l . t a Q t 0 l a » « l 

avq mlchqafi* ^ 

GO^CGACGCrGACTCCCCTG^C^CAACCCG^C^-^CAGA ? K T I t* 0 
GTTUTAt*SAA AM -^^^ 

GAGTGTCCGGCTGAGGCCTGAGCGACTtJTCCAGCCAAGGGCTGAC7TT77CCAGCACACw . ^ c ^ cr rcCACC-^CCATCCAGGTCGAGACCC^AGAA 

c^ccc^cactccccacatac^t^^ 

FIG. 11T 




FIG. 11U 



. ru at lacks moti^( ver - ~ 

O 1. » G % „ S 6 « 0 * % r a G « » * T C ° . " ,«-r«rrciACGGGGCCCG 

* s p ° s \ % * g v b s * a g . wricaGcrrcQ^^ r 



2) 



CGGCGC< 
ft 



t G * Q 0 - 8 



T - 
^OGCGCGAAGAACGTGCTGGCt 
G A K » V L A 




tfCCCAAAGGGTCAGA 



F/G. II V 



Lacks 



(if A and altered C-termi^ (ver. 2) 



■ ^^^^ 

^^^^ 

HASGPRaRLGCS ..^rv^r r^^CCACCCCX^GGACC^GTGGACCGAGTGACCG 

CAGCCCAA^Cr^^ . . . . . - 

SRSLPLPKRPRR^ . . rrarr „„ ct7Ix ^ CGC CAGCACC^CGCCXX5CCCCCC 

CTCTCTGAGGCCCAGCCTGACTGGCGCT^GGAGGCTCGTCGAGA _ w-^ GSi?w! , pa TPaRI.P 
SLRPSLTGAaK'- " . . „^^- r . r ^^caTCACCCCAO»o:CGCrrGTCTOTGCCCG 

Q V * O * V * A C 

GACGTGGAA(^TGAGCGTGCGGGACTGCGCTTGGCTGCGCA 'v'*?" A A « H » L * > » I ^ A 

THKHSVR3CAWL . _ . ^ A C'GffiUtf»GT^^ 

• ^r-r^citrT^^ w s k i* Q s i g 

GATGAGTGTGTACGTCGTCGAGCTGCrCAGGTCT^CTTT^ vT3TT?QK ;,RL??^aKb 
M S V Y V V B t » S - . „,^ ia ^CAGGCCCGCCCTGCT^^ 

aa^gacagcact^^ 

1 » V" 1 K 1 v 0 L . 

CGGCCTCCGGCCGATT^ £ 3 2 X R A 2 R L T S R V K A 

G LaPlVM;4D ' - • ™^^rTGTGCGG<^CCAGGACCCGC^^ 

gcgggcgccgcg^^ 

TGTCAAG QRl.TBVIASriik'U- 

KAAHGHV3KAF .^^TGTGC^ACCACGCOTG^ 

xscc^™^^^ a t . t =. 

DPLLVTPHL.HA _ ^ . / -^ r -» T YV"TrTr"* , GGATAC CCGGACC CTGGAGGTGCAGAGCGACTACTC CAG 

. o . - » • 

VEDEALGGTAt^ * . w ,^_^~rT^GGCTGAAGTGTCACAGCCTGm 

•^^rAACCGCGGCTTCAAGGCTG^ C H S L P L D 

ctatgcccggacctccatcagagccagt^cacc^caaccgcwjC^ca^ a g r h m a a k l f g v l r l k c h 

YARTSlRASLTr < . - ' ^ CCCATrrC ATCAGCAAGTrTGGAACAA 

taVMSLOTVCTMIV* 

'• ^CCrCTC^CCATCCTCAA^ 

ccccACArrrrrccrcK^crcATc^CAC^crcOTcr^ACTCCA L , A K s A , 

p T , , L » V X « » UAAC^CATITC^CGTaACTCCI^^rCCrr^ 
OBGMMCCMABWt^^ , 0 » 9 V O L G L • 



ajml(7523) 



\ 



fi»NI(7154) 
Ba7nHI(6627) ^ 
Nco I (6573) ■ 

5si WI(6467) \ '' 

> 'i 

Spliced Exon Alpha \ 
RT Motif A \ 

Xho I (6285) 
Pae R7I (6285) 
Unspliced Intron 1 
Motif 2 
,4ar II (6175). 
Motif 1 
TeioBox / 
Msc I (5944) 
ft* AI (5654)' 
Eco 47HI (5473) 
flg/ H (4539) 
£coRI(4533) 

lac S/D 
lacUV5-10 
trp-35 
Sap I (4190) 



&/I(l) 



/ 



/ice I (2) 



Hind m (19) 
rrnB ter 




Bel I (1460) 
laclQ 

fljwl(1952) 



Sea 1 (2704) 
ampR 



ORI 



FIG. ISA 



LOCUS pAKI28.4 7615 bp dsDKA Circular 

DEFINITION Human telomerase clone with exon beta spliced out 



1 tcgacctgca ggcatgcaag cttggcactg gccgtcgttt tacaacgtcg tgactgggaa 

61 aaccctggcg ttacccaact taatcgcctt gcagcacatc cccctttcgc cagctggcgt 

121 aatagcgaag aggcccgcac cgatcgccct tcccaacagt tgcgcagcct gaatggcgaa 

181 tggcgcctga tgcggtattt tctccttacg catctgtgcg gtatttcaca ccgcataaat 

241 tccctgtttt ggcggatgag agaagatttt cagcctgata cagattaaat cagaacgcag 

301 aagcggtctg ataaaacaga atttgcctgg cggcagtagc gcggtggtcc cacctgaccc 

361 catgccgaac tcagaagtga aacgccgtag cgccgatggt agtgtggggt ctccccatgc 

421 gagagtaggg aactgccagg catcaaataa aacgaaaggc tcagtcgaaa gactgggcct 

481 ttcgttttat ctgttgtttg tcggtgaacg ctctcctgag taggacaaat ccgccgggag 

541 cggatttgaa cgttgcgaag caacggcccg gagggtggcg ggcaggacgc ccgccataaa 

601 ctgccaggca tcaaattaag cagaaggcca tcctgacgga tggccttttt gcgtttctac 

661 aaactcttcc tgtcgtcata tctacaagcc atccccccac agatacggta aactagcctc 

721 gtttttgcat caggaaagca gggaatttat ggtgcactct cagtacaatc tgctctgatg 

781 ccgcatagtt aagccagccc cgacacccgc caacacccgc tgacgcgccc tgacgggctt 



FIG. 13B 




841 gtctgctccc ggcatccgct; tacagacaag 
901 agaggttttc accgtcatca ccgaaacgcg 
961 ttttataggt taatgtcatg ataataatgg 
1021 ccatcgaatg gtgcaaaacc tttcgcggta 
1081 tcagggtggt gaatgrgaaa ccagtaacgt 
1141 cttatcagac cgtttcccgc gtggrgaacc 
1201 aaaaagtgga agcggcgatg gcggagcrga 
1261 tggcgggcaa acagtcgttg ctgattggcg 
1321 cgtcgcaaat tgtcgcggcg attaaatctc 
1381 tgtcgatggt agaacgaagc ggcgtcgaag 
1441 cgcaacgcgt: cagtgggctg atcattaact 
1501 tggaagctgc ctgcactaat gtrccggcgt 
1561 tcaacagtat tattttctcc catgaagacg 
1621 cattgggtca ccagcaaatc gcgctgttag 
1681 tgcgtctggc tggctggcat aaatatctca 
1741 gggaaggcga ctggagtgcc atgtccggtt 
1801 gcatcgttcc cactgcgatg ctggttgcca 
1861 ccattaccga gtccgggctg cgcgtrggtg 
1921 ccgaagacag ctcatgttat atcccgccgt 
1981 tggggcaaac cagcgtggac cgcrcgcrgc 
2041 atcagctgtt: gcccgrcrca crggcgaaaa 
2101 ccgcctctcc ccgcgcgtrg gccgacrca: 
2161 tggaaagcgg gcagtgagcg caacgcaact 
2221 caggctttac actctacgcr zccqaczzqc 
2281 ggaaatgtgc gcggaacccc tar::gt::a 
2341 ctcatgagac aataaccctg ataaa^gcrt 
2401 attcaacatt tccgtgrcgc cc:ra:::c: 
2461 gctcacccag aaacgc^ggt. gaaagtaaaa 
2521 ggttacatcg agaacrggat cccaacagcg 
2581 aacgttttcc aatgatgagc acr:::aaag 
2641 ttgacgccgg gcaagagcaa crcggtcgcc 
2701 agtactcacc agtcacagaa aagcancrra 
2761 gtgctgccat aaccatgagt gataacacrg 
2821 gaccgaagga gctaaccgct tt:t:gcaca 
2881 gttgggaacc ggagctgaat gaagccatac 
2941 tagcaatggc aacaacgrtg cgcaaacrat 
3001 ggcaacaatt aatagactgg acggaggcgg 
3061 cccttccggc tggctggttt attgcrgata 
3121 gtatcatrgc agcactgggg ccagacggra 
3181 cggggagtca ggcaactatg gatgaacgaa 
3241 tgattaagca ttggtaactg tcagaccaag 
3301 aacttcattt ttaatttaaa aggacctagg 
3361 aaatccctta acgrgagttt tcqnzccacz 
3421 gatcttcttg agatcctttt tttc-gcgcg 
3481 cgctaccagc ggtggttcgr ttgccgganc 
3541 ctggcttcag cagagcgcag ataccaaata 
3601 accacttcaa gaactctgta gcaccgccta 
3661 tggctgctgc cagtggcgat aagtcgtgtc 
3721 cggataaggc gcagcggtcg ggctgaacgg 
3781 gaacgaccta caccgaactg agatacctac 
3841 ccgaagggag aaaggcggac aggtatccgg 
3901 cgagggagct tccaggggga aacgccrggt: 
3961 tctgacttga gcgtcgattt trgtgatgcr 
4021 ccagcaacgc ggccttttta cggttccrgg 
4081 ttcctgcgtt atcccctgat tcrgtggata 
4141 ccgctcgccg cagccgaacg accgagcgca 
4201 gcccaatacg caaaccgcct ctccccgcgc 




etgtgaccgt ctccgggagc tgcatgtgtc 
cgagacgaaa gggcctcgtg atacgcctat 
tttcttagac gtgaggttct gtacccgaca 
tggcatgata gcgcccggaa gagagtcaat 
tatacgatgt cgcagagtat gccggtgtct 
aggccagcca cgtttctgcg aaaacgcggg 
attacattcc caaccgcgtg gcacaacaac 
ttgccacctc cagtctggcc ctgcacgcgc 
gcgccgatca actgggtgcc agcgtggtgg 
cctgtaaagc ggcggtgcac aatcttctcg 
atccgctgga tgaccaggat gccattgctg 
tatttcttga tgtctctgac cagacaccca 
gtacgcgact gggcgtggag catctggtcg 
cgggcccatt aagttctgtc tcggcgcgtc 
ctcgcaatca aattcagccg atagcggaac 
ttcaacaaac catgcaaatg ctgaatgagg 
acgatcagat ggcgctgggc gcaatgcgcg 
cggatatctc ggtagtggga tacgacgata 
taaccaccat caaacaggat tttcgcctgc 
aactctctca gggccaggcg gtgaagggca 
gaaaaaccac cctggcgccc aatacgcaaa 
taatgcagcr ggcacgacag gtttzcccgac 
aatgtaagtt agctcactca ttaggcaccc 
aagaacctca cgtcaggtgg cacttttcgg 
ttttcctaaa tacattcaaa tatgtatccg 
caataatatt gaaaaaggaa gagtatgagt 
ctttrtgcgg catttcgcct tcctgtcrtt 
gatgctgaag atcagttggg tgcacgagtg 
gtiaagatccc tgagagtttt cgccccgaag 
ttictgctatg tggcgcggta ttatcccgta 
gcatacacta ttctcagaar gacttggtcg 
cggatggcat gacagtaaga gaattatgca 
cggccaactc acttctgaca acgatcggag 
acacggggga ccatgtaact cgccttgatc 
caaacgacga gcgtgacacc acgatgcctg 
taactggcga actacttact ctagcttccc 
ataaagttgc aggaccactt ctgcgctcgg 
aatctggagc cggtgagcgt gggtctcgcg 
agccctcccg tatcgtagtt atctacacga 
atagacagat cgctgagata ggtgcctcac 
tttactcata tatactttag attgatttaa 
tgaagatccr ttttgataat ctcatgacca 
gagcgtcaga ccccgtagaa aagatcaaag 
taarctgctg cttgcaaaca aaaaaaccac 
aagagctacc aactcttttt ccgaaggtaa 
ctgtccttct agtgtagccg tagttaggcc 
catacctcgc tctgctaatc ctgttaccag 
traccgggtt ggactcaaga cgatagttac 
ggggttcgtg cacacagccc agcttggagc 
agcgtgagca ttgagaaagc gccacgcttc 
taagcggcag ggtcggaaca ggagagcgca 
atctttatag tcctgtcggg tttcgccacc 
cgrcaggggg gcggagccta tggaaaaacg 
ccttttgctg gccttttgct cacatgttct 
accgtattac cgcctttgag tgagctgata 
gcgagtcagt gagcgaggaa gcggaagagc 
gttggccgat tcattaatgc agaattaatt 
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4261 ctcatgttrg acagcttatc atcgactgca cggtgcacca atgcttctgg cgtcaggcag 
4321 ccatcggaag ctgtggtatg gctgtgcagg tcgtaaatca ctgcataatt cgtgtcgctc 
4381 aaggcgcact: cccgtrctgg ataatgttcr ttgcgccgac atcataacgg ttctggcaaa 
4441 tattctgaaa tgagctgttg acaattaatc atcggctcgt ataatgtgtg gaattgtgag 
4501 cggataacaa tttcacacag gaaacagcga tgaattcaga tctcaccatg aaggagctgg 
4561 tggcccgagt gctgcagagg ctgtgcgagc gcggcgcgaa gaacgtgctg gccttcggct 
4621 tcgcgcrgcr ggacggggcc cgcgggggcc cccccgaggc cttcaccacc agcgtgcgca 
4681 gctacctsgcc caacacggtg accgacgcac tgcgggggag cggggcgtgg gggctgctgc 
4741 tgcgccgcgt gggcgacgac gtgcrggtrc acctgctggc acgctgcgcg ctctttgtgc 
4801 tggtggcrcc cagctgcgcc taccaggtgt: gcgggccgcc gctgtaccag ctcggcgctg 
4861 ccactcaggc ccggcccccg ccacacgctia gtggaccccg aaggcgtctg ggatgcgaac 
4921 gggcctggaa ccatagcgtc agggaggccg gggtccccct gggcctgcca gccccgggtg 
4981 cgaggaggcg cgggggcagt gccagccgaa gtctgccgtt gcccaagagg cccaggcgtg 
5041 gcgctgcccc tgagccggag cggacgcccg ttgggcaggg gtcctgggcc cacccgggca 
5101 ggacgcgtgg accgagtgac cqzqqzzzzz gtgtggtgtc acctgccaga cccgccgaag 
5161 aagccacctc tttggagggt qcqczczzzq gcacgcgcca ctcccaccca tccgtgggcc 
5221 gccagcacca cgcgggcccc ccatccacat cgcggccacc acgtccctgg gacacgcctt 
5281 gtcccccggt gtacgccgag accaagcac: tccrctactc ctcaggcgac aaggagcagc 
5341 zqcqqcczzz cttcctactc aqczzzzzqa ggcccagcct gactggcgct cggaggctcg 
5401 tggagaccat czzzzzqqqz tccaggccc- ggatgccagg gactccccgc aggttgcccc 
5461 gcctgcccca gcgcractgg caaatgcggc czzzqzzzzz ggagctgctt gggaaccacg 
5521 cgcagtgccc ctacggggtg c-cctcaaga cgcactgccc gctgcgagct gcggtcaccc 
5581 cagcagccgg zqZzzqzqcz cgggacaagc cccagggctc tgtggcggcc cccgaggagg 
5641 aggacacaga czzzzqzzqz czqqzqzaqz cgctccgcca gcacagcagc cccrggcagg 
5701 tgracggctc cgrgcgggcc zqczzqczzz qqczggzqcc cccaggcctc tggggcrcca 
5761 ggcacaacga acgccgcttc c-caggaaca ccaagaagtt: catctccctg gggaagcatg 
5821 zzaaqzzzzz gcrgcaggag c~gacgzgga agatgagcgt gcgggaccgc gctitggcrgc 
5881 gcaggagccc aqqgqzzqgz zqzqzzzzqq ccgcagagca ccgtctgcgt gaggagatcc 
5941 tggccaagtr cctgcactgg ctgargagrg tgracgtcgr cgagctgctc aggtctttct 
6001 tttatgtcac ggagaccacg :tt:aaaaga acaggctctt tttctaccgg aagagtgtct 
6061 ggagcaagtt gcaaagcact ggaa—agac agcacttgaa gagggtgcag ctgcgggagc 
6121 tgrcggaagc agaggtcagg cagcaccggg aagccaggcc cgccctgctg acgtccagac 
6181 tccgccrcat czzzaaqzzz gacgggc.gc ggccgattgt gaacatggac tacgtcgtgg 
6241 gagccagaac gttccgcaga gaaaagaggg ccgagcgtct cacctcgagg gtgaaggcac 
6301 tgrtcagcgt gctcaactac gagcgggcgc ggcgccccgg cctcctgggc gcctctgtgc 
6361 tgggcctgga cgaratccac agggcc-ggc gcaccttcgt gctgcgtgtg cgggcccagg 
6421 acccgccgcc tgagcrgtac c~cg-caagg tggatgtgac gggcgcgrac gacaccatcc 
6481 cccaggacag gctcacggag gteazcgcca gcatcatcaa accccagaac acgtactgcg 
6541 tgcgtcggra tgccgtggtc cagaaggccg cccatgggca cgtccgcaag gccttcaaga 
6601 gccacgtccr acgrccagtg ccagggga-c ccgcagggct ccatcctctc cacgctgctc 
6661 tgcagccrgt gctacggcga cacggagaac aagctgtttg cggggattcg gcgggacggg 
6721 ctgctcctgc gtttggrgga tgactts—g ttggtgacac ctcacctcac ccacgcgaaa 
6781 acttccccag qacczqqzcz qaaqzqzzzz gagtatggct gcgtggtgaa ctcgcggaag 
6841 acagtggtga aczzczzzqz agaagacgaa gccctgggtg gcacggcttt tgttcagatg 
6901 ccggcccacg qcztazzzzz c-ggrgcggc ctgctgctgg atacccggac cctggaggtg 
6961 cagagcgact: acrccagcta tgcccggacc tccatcagag ccagtctcac cttcaaccgc 
7021 ggcttcaagg ctgggaggaa catgcg—gc aaactctttg gggtcttgcg gctgaagtgt 
7081 cacagccrgt tzczqqazzz gcaggrgaac agcctccaga cggtgtgcac caacatctac 
7141 aagatccrcc tgctgcaggc gtacagg—- cacgcatgrg tgctgcagct cccatttcat 
7201 cagcaagtrt ggaagaaccc zazazzzzzz ctgcgcgtca tctctgacac ggcctccctc 
7261 tgctacrcca tccrgaaagc caagaacgca gccgaagaaa acatrtctgt cgtgactcct 
7321 gcggtgcttg ggtcgggaca gccagaga-g gagccacccc gcagaccgtc gggtgtgggc 
7381 agctttccgg tqzzzcczgq qaqqqqaqzz gggctgggcc tgtgactcct cagcctctgt 
7441 tttcccccag ggatgtcgct gggggccaag ggcgccgccg gccctctgcc ctccgaggcc 
7501 gtgcagtggc tgtgccacca agcat-cc-g ctcaagctga ctcgacaccg tgtcacctac 
7561 gtgccactcc tggggtcact caggacaggc aagtgtgggt ggaggccagt gcggg 
D:\Vector NTI\pAKX23 . 4 . gb 
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LOOTS pAKI28.7 7797 bp dsDHA Circular 

DEFINITION Human telamerase clone with alternative C-terminus 



1 tcgacctgca ggcatgcaag cttggcactg 
61 aaccctggcg ttacccaact taatcgcctt 
121 aatagcgaag aggcccgcac cgatcgccct 
181 tggcgcctga tgcggtattt tctccttacg 
241 tccctgtttt ggcggatgag agaagatttt 
301 aagcggtctg ataaaacaga atttgcctgg 
361 catgccgaac tcagaagtga aacgccgtag 
421 gagagtaggg aactgccagg catcaaataa 
481 ttcgttttat ctgttgtttg tcggtgaacg 



gccgtcgttt tacaacgtcg tgactgggaa 
gcagcacatc cccctttcgc cagctggcgt 
tcccaacagt tgcgcagcct gaatggcgaa 
catctgtgcg gtatttcaca ccgcataaat 
cagcctgata cagattaaat cagaacgcag 
cggcagtagc gcggtggtcc cacctgaccc 
cgccgatggt agtgtggggt ctccccatgc 
aacgaaaggc tcagtcgaaa gactgggcct 
ctctcctgag taggacaaat ccgccgggag 
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541 cggatttgaa cgttgcgaag caacggcccg gagggtggcg ggcaggacgc ccgccataaa 
601 ctgccaggca tcaaattaag cagaaggcca tcctgacgga tggccttttt gcgtttctac 
661 aaactcttcc tgtcgtcata tctacaagcc atccccccac agatacggta aactagcertc 
721 gtttttgcat caggaaagca gggaatttat ggtgcactct cagtacaatc tgctctgatg 
781 ccgcatagtt aagccagccc cgacacccgc caacacccgc tgacgcgccc tgacgggctt 
841 gtctgctccc ggcatccgct tacagacaag ctgtgaccgt ctccgggagc tgcatgtgtc 
901 agaggttttc accgtcatca ccgaaacgcg cgagacgaaa gggcctcgtg atacgcctat 
961 ttttataggt taatgtcatg ataataatgg tttcttagac gtgaggttct gtacccgaca 
1021 ccatcgaatg gtgcaaaacc tttcgcggi;a tggcatgata gcgcccggaa gagagtcaat 
1081 tcagggtggt gaatgtgaaa ccagtaacgt tatacgatgt cgcagagtat gccggtgtct 
1141 cttatcagac cgtttcccgc gtggtgaacc aggccagcca cgtttctgcg aaaacgcggg 
1201 aaaaagtgga agcggcgatg gcggagcrga attacattcc caaccgcgtg gcacaacaac 
1261 tggcgggcaa acagtcgttg crgattggcg ttgccacctc cagtctggcc ctgcacgcgc 
1321 cgtcgcaaat tgtcgcggcg attaaatctc gcgccgatca actgggtgcc agcgtggtgg 
1381 tgtcgatggt agaacgaagc ggcgtcgaag cctgtaaagc ggcggtgcac aatcttctcg 
1441 cgcaacgcgr cagtgggctg atcattaacr atccgctgga tgaccaggat gccattgctg 
1501 tggaagctgc ctgcactaat gttccggcgt tatttcttga tgtctctgac cagacaccca 
1561 tcaacagtat tattttctcc catgaagacg gtacgcgact gggcgtggag catctggtcg 
1621 cattgggtca ccagcaaatc gcgcrgt-ag cgggcccatt aagttctgtc tcggcgcgtc 
1681 tgcgtctggc tggctggcat aaatatctca ctcgcaatca aattcagccg atagcggaac 
1741 gggaaggcga ctggagrgcc acgtccggtir trcaacaaac catgcaaatg ctgaatgagg 
1801 gcatcgtrcc cactgcgatg c-ggrrgcca acgatcagat ggcgctgggc gcaatgcgcg 
18 61 ccatcaccga gtccgggctg cgcgtcggrg cggatatctc ggtagtggga tacgacgata 
1921 ccgaagacag ctcatgrtar accccgccg- taaccaccat caaacaggat tttcgcctgc 
1981 tggggcaaac cagcgrggac cgcrrgc-gc aactctctca gggccaggcg gtgaagggca 
2041 atcagctgrt gcccgtcrca crggrgaaaa gaaaaaccac cctggcgccc aatacgcaaa 
2101 ccgcctctcc ccgcgcgtrg gccgactca: taatgcagct: ggcacgacag gtttcccgac 
2161 tggaaagcgg gcagtgagcg caacgcaacr aatgraagrt agctcactca ttaggcaccc 
2221 caggczttac act—atgcc tccgacc-gc aagaacctca cgtcaggtgg cacttttcgg 
2281 ggaaatgtgc gcggaacccc tartr-g-rra tttttctaaa tacattcaaa tatgtatccg 
2341 ctcatgagac aaraaccctg araaatgct: caataatatt gaaaaaggaa gagtatgagt. 
2401 attcaacatt tccgtgccgc ccttattccc ttttttgcgg cattttgcct tcctgttttt 
2461 gctcacccag aaacgccggr gaaagcaaaa gatgctgaag atcagttggg tgcacgagtg 
2521 ggttacaccg agaactggat crcaacagcg gtaagatcct tgagagtttt cgccccgaag 
2581 aacgttttcc aatgacgagc acrzttaaag ttctgctatg tggcgcggta ttatcccgta 
2641 ttgacgccgg gcaagagcaa crcggtcgcc gcatacacta ttctcagaat gacttggttg 
2701 agtactcacc agtcacagaa aagcatc-a cggatggcat gacagtaaga gaattacgca 
2761 gtgcrgccat aaccatgagt gataacaczg cggccaactt acttctgaca acgatcggag 
2821 gaccgaagga gctaaccgct trctrgcaca acatggggga tcatgtaact cgccttgatc 
2881 gttgggaacc ggagctgaat gaagccacac caaacgacga gcgtgacacc acgatgcctg 
2941 tagcaatggc aacaacgttg cgcaaactat taactggcga actacttact ctagcttccc 
3001 ggcaacaatt aatagactgg arggaggcgg ataaagttgc aggaccactt ctgcgctcgg 
3061 cccttccggc tggctggttt attgcrgaca aarctggagc cggtgagcgt gggtctcgcg 
3121 gtatcattgc agcactgggg ccagarggta agccctcccg tatcgtagtt atctacacga 
3181 cggggagtca ggcaacratg gacgaacgaa atagacagat cgctgagata ggtgcctcac 
3241 tgattaagca ttggtaactg tcagaccaag tttactcata tatactttag attgatttaa 
3301 aacttcattt ttaatttaaa aggatcragg tgaagatcct ttttgataat ctcatgacca 
3361 aaatccctta acgtgagttt tcgttccact gagcgtcaga ccccgtagaa aagatcaaag 
3421 gatcttcttg agatcctttt trtctgcgcg taatctgcrg cttgcaaaca aaaaaaccac 
3481 cgctaccagc ggtggtttgt ttgccgcarc aagagctacc aactcttttt ccgaaggtaa 
3541 ctggcttcag cagagcgcag ataccaaara ctgtccttct agtgtagccg tagttaggcc 
3601 accacttcaa gaactctgta gcaccgccta catacctcgc tctgctaatc ctgttaccag 
3661 tggcrgctgc cagtggcgat aagtcgtgrc ttaccgggtt ggactcaaga cgatagttac 
3721 cggataaggc gcagcggtcg ggctgaacgg ggggttcgtg cacacagccc agcttggagc 
3781 gaacgaccta caccgaactg agatacccac agcgtgagca ttgagaaagc gccacgcttc 
3841 ccgaagggag aaaggcggac aggtatccgg taagcggcag ggtcggaaca ggagagcgca 
3901 cgagggagct tccaggggga aacgcctggr atctttatag tcctgtcggg tttcgccacc 
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cgcagtgccc 
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tttatgtcac 
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tgtcggaagc 
tccgcttcat 
gagccagaac 
tgttcagcgt 
tgggcctgga 
acccgccgcc 
cccaggacag 
tgcgtcggta 
gccacgtctc 
aggagaccag 
ccagcagtgg 
ggggcaagtrc 
tctgcagcct 
ggctgctcct 
aaacttcctc 
agacagtggt 
tgccggccca 
tgcagagcga 
gcggctccaa 
gtcacagcct 
acaagatcct 



gcgtcgat ct 
ggcctttrta 
atcccctgat 
cagccgaacg 
caaaccgcct 
acagcttatc 
ctgtggtatg 
cccgttctgg 
tgagctgttg 
tttcacacag 
gctgcagagg 
ggacggggcc 
caacacggrg 
gggcgacgac 
cagctgcgcc 
ccggcccccg 
ccatagcgtc 
cgggggcagr 
tgagccggag 
accgagtgac 
tttggagggr 
cgcgggcccc 
gtacgccgag 
cttcctactc 
ctttcrgggr 
gcgctacrgg 
ctacgggg~g 
tgtctgtgcc 
cccccgtcgc 
cgtgcgggcc 
acgccgcr-c 
gctgcaggag 
aggggttggc 
cctgcactgg 
ggagaccacg 
gcaaagcac - 
agaggtcagg 
ccccaagcct 
gttccgcaga 
gctcaactac 
cgatatccac 
tgagctgtac 
gctcacggag 
tgccgtggtc 
taccttgaca 
cccgctgagg 
cctcttcgac 
ctacgtccag 
gtgctacggc 
gcgtttggtg 
aggacctggr 
gaacttcccr 
cggcctattc 
ctactccagc 
ggctgggagg 
gtttctggat 
cctgctgcag 



ttgrgacgcr 
cggtrccrgg 
tctgtggata 
accgagcgca 
ctccccgcgc 
atcgactgca 
gctgtgcagg 
ataargrrtt: 
acaattaatc 
gaaacagcga 
ctgtgcgagc 
cgcgggggcc 
accgacgcac 
gtigcrggrrc 
taccaggrgr 
ccacacgcta 
agggaggccg 
gccagccgaa 
cggacgcccg 
cgrgg---c- 
gcgc-c-c-g 
eca"caca- 
accaaccac- 
agctic ".ga 
rccaggcrc- 
caaacncczac 



ctcctcaaga 
cgggagaagc 
ctggcgcagc 
tgcccgcgcc 
crcaggaaca 
crgacg-gga 
"gtg" ccgg 
crgaugag-g 
titcaaaaga 
ggaarcagac 
cagcaccggg 
gacgggc »gc 
gaaaagaggg 
gagcgggcgc 
agggcc-ggc 
ctcgrcaagg 
gtcaTicgcca 
cagaaggccg 
gaccrccagc 
gargccgrcg 
gtcrtccrac 
tgccagggga 
gacacggaga 
gatga""- 
ccgaag-g— 
gtagaagacg 
cccrggrgcg 
tatgcccgca 
aacat:gcg::c 
ttgcagg-ga 
gcgtacaggr 



cgtcaggggg 
ccttttgctg 
accgtattac 
gcgagtcagt 
gttggccgat 
cggtgcacca 
tcgtaaatca 
ttgcgccgac 
atcggctcgt 
tgaattcaga 
gcggcgcgaa 
cccccgaggc 
tgcgggggag 
acctgctggc 
gcgggccgcc 
gtggaccccg 
gggtccccct 
gtctgccgtt 
ttgggcaggg 
gtgtggtgtzc 
gcacgcgcca 
cgcggccacc 
tcctctactc 
ggcccagcct 
ggargccagg 
cccrgtttct: 
cgcactgccc 
cccagggcrc 
tgctccgcca 
ggctggtgcc 
ccaagaagtt 
agacgagcgt 
ccgcagagca 
tgracgtcgt 
acaggcrctt 
agcacttgaa 
aagccaggcc 
ggccgattgt 
ccgagcgtct 
ggcgccccgg 
gcaccttcgt 
tggatgtgac 
gcatcatcaa 
cccatgggca 
cgtacatgcg 
tcatcgagca 
gcttcatgtg 
tcccgcaggg 
acaagctgtt 
tgttggtgac 
ctgagtatgg 
aagccctggg 
gccrgctgct 
ccrccatcag 
gcaaactctt 
acagcctcca 
crcacgcatg 



gcggagccta 
gccttttgct 
cgcctttgag 
gagcgaggaa 
tcattaatgc 
atgcttctgg 
ctgcataatt 
atcataacgg 
ataatgtgtg 
tctcaccatg 
gaacgtgctg 
cttcaccacc 
cggggcgtgg 
acgctgcgcg 
gctgtaccag 
aaggcgtctg 
gggcctgcca 
gcccaagagg 
gtcctgggcc 
accrgccaga 
ctcccaccca 
acgtccctgg 
ctcaggcgac 
gactggcgct 
gaccccccgc 
ggagcrgcrt 
gctgcgagct 
tgtggcggcc 
gcacagcagc 
cccaggcctc 
catctccctg 
gcgggactgc 
ccgtctgcgt 
cgagctgctc 
tttctaccgg 
gagggtgcag 
cgccctgctg 
gaacatggac 
cacctcgagg 
cctcctgggc 
gctgcgtgtg 
gggcgcgtac 
accccagaac 
cgtccgcaag 
acagrtcgtg 
gagctcctcc 
ccaccacgcc 
ctccatcctc 
tgcggggatt 
acctcacctc 
ctgcgtggtg 
tggcacggct 
ggatacccgg 
agccagtctc 
tggggtcttg 
gacggtgtgc 
tgtgctgcag 



tggaaaaacg 
cacatgttct 
tgagctgata 
gcggaagagc 
agaattaatt 
cgtcaggcag 
cgtgtcgctc 
ttctggcaaa 
gaattgtgag 
aaggagctgg 
gccttcggct 
agcgtgcgca 
gggctgctgc 
ctctttgtgc 
ctcggcgctg 
ggatgcgaac 
gccccgggtg 
cccaggcgtg 
cacccgggca 
cccgccgaag 
tccgrgggcc 
gacacgcctt 
aaggagcagc 
cggaggctcg 
aggttgcccc 
gggaaccacg 
gcggtcaccc 
cccgaggagg 
ccctggcagg 
tggggctcca 
gggaagcatg 
gcttggctgc 
gaggagatcc 
aggtctttct 
aagagtgtct 
ctgcgggagc 
acgtccagac 
tacgtcgtgg 
gtgaaggcac 
gcctctgtgc 
cgggcccagg 
gacaccatcc 
acgtactgcg 
gccttcaaga 
gctcacctgc 
ctgaatgagg 
gtgcgcatca 
tccacgctgc 
cggcgggacg 
acccacgcga 
aacttgcgga 
tttgttcaga 
accctggagg 
accttcaacc 
cggctgaagt 
accaacatct 
ctcccatttc 
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7381 atcagcaagt ttggaagaac cccacatttt 
7441 tctgctactc catcctgaaa gccaagaacg 
7501 ctgcggtgct tgggtcggga cagccagaga 
7561 gcagctttcc ggtgtctcct gggaggggag 
7621 gttttccccc agggatgtcg ctgggggcca 
7681 ccgtgcagtg gcngtgccac caagcattcc 
7741 acgtgccact cctggggtca ctcaggacag 




tcctgcgcgt catctctgac acggcctccc 
cagccgaaga aaacatttct gtcgtgactc 
tggagccacc ccgcagaccg tcgggtgtgg 
ttgggctggg cctgtgactc ctcagcctct 
agggcgccgc cggccctctg ccctccgagg 
tgctcaagct gactcgacac cgtgtcacct 
gcaagtgtgg gtggaggcca gtgcggg 
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LOCUS pAKI28.14 7688 bp daDNA Circular 

DEFINITION Human telomerase clone with exon alpha spliced out 



1 tcgacctgca ggcatgcaag cttggcactg gccgtcgttt tacaacgtcg tgactgggaa 
61 aaccctggcg ttacccaact taatcgcctt gcagcacatc cccctttcgc cagctggcgt 
121 aatagcgaag aggcccgcac cgatcgccct tcccaacagt tgcgcagcct gaatggcgaa 
181 tggcgcctga tgcggtattt tctccttacg catctgtgcg gtatttcaca ccgcataaat 
241 tccctgtttt ggcggatgag agaagatttt cagcctgata cagattaaat cagaacgcag 
301 aagcggtctg ataaaacaga atttgcctgg cggcagtagc gcggtggtcc cacctgaccc 
361 catgccgaac tcagaagtga aacgccgtag cgccgatggt agtgtggggt ctccccatgc 
421 gagagtaggg aactgccagg catcaaataa aacgaaaggc tcagtcgaaa gactgggcct 
481 ttcgttttat ctgttgtttg tcggtgaacg ctctcctgag taggacaaat ccgccgggag 
541 cggatttgaa cgttgcgaag caacggcccg gagggtggcg ggcaggacgc ccgccataaa 
SOI ctgccaggca tcaaattaag cagaaggcca tcctgacgga tggccttttt gcgtttctac 
661 aaactcttcc tgtcgtcata tctacaagcc atccccccac agatacggta aactagcctc 
721 gtttttgcat caggaaagca gggaatttat ggtgcactct cagtacaatc tgctctgatg 
781 ccgcatagtt aagccagccc cgacacccgc caacacccgc tgacgcgccc tgacgggctt 
841 gtctgctccc ggcatccgct tacagacaag ctgtgaccgt ctccgggagc tgcatgtgtc 
901 agaggtttrc accgtcatca ccgaaacgcg cgagacgaaa gggcctcgtg atacgcctat 
961 ttttataggt taatgtcatg ataataatgg tttcttagac gtgaggttct gtacccgaca 
1021 ccatcgaatg gtgcaaaacc tttcgcggta tggcatgata gcgcccggaa gagagtcaat 
1081 tcagggtggt gaatgtgaaa ccagtaacg- tatacgatgt cgcagagtat gccggtgtc^ 
1141 cttatcagac cgtttcccgc gtgg-gaacc aggccagcca cgtttctgcg aaaacgcggg 
1201 aaaaagcgga agcggcgatg gcggagc.ga atcacatrcc caaccgcgtg gcacaacaac 
1261 tggcgggcaa acagt=gt-g crga-cggcg ttgccacccc cagtctggcc ctgcacgcgc 
1321 cgtcgcaaat tgrcgcggcg attaaa~- = gcgccgatca actgggtgcc agcgtggtgg 
1381 tgtcgacggt agaacgaagc ggcgtcgaag cccgtaaagc ggcggtgcac aatcttctcg 
1441 cgcaacgcgt cagtgggc^g a-cac.aac- atccgctgga tgaccaggat gccattgctg 
1501 tggaagctgc ctgcacraat g«c=ggcgt tacttcttga tgtcrctgac 
1561 tcaacagtat tactttctcc catgaagacg gtacgcgact gggcgtggag catcggtcg 
1621 cattgggtca ccagcaaatc gcgctg~ag cgggcccatt aagttctgtc tcggcgcgtc 
1631 tgcgtctggc tggctggcat aaacat-.ca ctcgcaacca aattcagccg atagcggaac 
1741 gggaaggcga ctggagtgcc atgtccggtt ttcaacaaac catgcaaatg =«-9"tgagg 
1801 gcatcgttcc cactgcgacg ctggtrgcca acgatcagat ggcgctgggc gcaatgcgcg 
18 61 ccattaccga gtccgggctg cgcgttggtg cggatacctc ggtagtggga tacgacgata 
1921 ccgaagacag ctcangt-an atcccgccg- taaccaccat caaacaggat t.tcgcctgc 
1981 tggggcaaac cagcgrggac cgcttgc-.gc aactctctca gggccaggcg gtgaagggca 
2041 atcagctgt- gcccgtctca c-ggtgaaaa gaaaaaccac cctggcgccc aatacgcaaa 
2101 ccgcctctcc ccgcgcgttg gccgatt=a. -aatgcagct ggcacgacag gtttcccgac 
2161 tggaaagcgg gcagtgagcg caacgcaac. aatgtaagtt agctcactca ttaggcaccc 
2221 caggctttac actttatgct tccgacc-gc aagaacctca cgtcaggtgg cacttttcgg 
2281 ggaaatgtgc gcggaacccc tatttgt"a tttttctaaa tacattcaaa tatgtatccg 
2341 c-catgagac aataaccctg ataaatgctc caataatatt gaaaaaggaa gagtatgagt 
2401 attcaacatt tccgtgtcgc ccttattccc ttttttgcgg cattttgcct tcctgttttt 
2461 gccacccag aaacgctggt gaaag-aaaa gangctgaag atcagttggg tgcacgagtg 
2521 qqttacaccg agaactggar ctcaacagcg gtaagatcct tgagagtttt cgccccgaag 
2581 aacgttttcc aatgatgagc acttttaaag "ctgctatg tggcgcggta ttatcccgta 
264i ttqacgccgg gcaagagcaa ctcgg~gc= gcatacacta ttctcagaat gac.tggtug 
2701 agtactcacc agtcacagaa aagca^c.ca cggatggcat gacagtaaga gaattatgca 
2761 gtgctgccat aaccatgagt gataacactg cggccaactt acttctgaca acgatcggag 
2821 gaccgaagga gctaaccgct cttttgcaca acatggggga tcatgtaact cgcctv.gatc 
2881 gttgggaacc ggagctgaat gaagccacac caaacgacga gcgtgacacc acgatgcctg 
2941 tagcaatggc aacaacgttg cgcaaactat taactggcga actacttact ctagcttccc 
3001 ggcaacaatt aatagactgg atggaggcgg ataaagttgc aggaccactt ctgcgc-cgg 
3061 cccttccggc tggctggttc attgccgaca aatctggagc cggtgagcgt gggtccgcg 
3121 gtatcattgc agcactgggg ccagacggta agccctcccg tatcgtagtt atctacac^a 
3181 cggggagtca ggcaactatg gatgaacgaa atagacagat cgctgagata ggtgcc-cac 
3241 tgattaagca ttggtaactg tcagaccaag tttactcata tatactttag a "gat^aa 
3301 aacttcattt ttaatttaaa aggatctagg tgaagatcct ttttgataac ctcatgacca 
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3361 aaatccctta acgtgagttt tcgtrccact 
3421 gatcttcttg agatcctttt ttrcrgcgcg 
3481 cgctaccagc ggUggtrtgt ttgccggatc 
3541 ctggcttcag cagagcgcag ataccaaata 
3601 accacttcaa gaactctgta gcaccgccta 
3661 tggctgctgc cagtggcgat aagtcgtgtc 
3721 cggataaggc gcagcggtcg ggcrgaacgg 
3781 gaacgaccta caccgaactg agatacctac 
3841 ccgaagggag aaaggcggac aggtatccgg 
3901 cgagggagct tccaggggga aacgcctggt 
3961 tctgacttga gcgtcgatut ttgHgatgct 
4021 ccagcaacgc ggccttttta cggttcctgg 
4081 ttccrgcgtt atcccctgat tctgtggata 
4141 ccgctcgccg cagccgaacg accgagcgca 
4201 gcccaatacg caaaccgcct crccccgcgc 
4261 ctcatgtttg acagcttatc atcgactgca 
4321 ccatcggaag ctgtggtatg gcrgtgcagg 
4381 aaggcgcact cccgttctgg ataargrttt 
4441 tattctgaaa tgagctigttg acaartaatc 
4501 cggataacaa tttcacacag gaaacagcga 
4561 tggcccgagt gcrgcagagg ctgcgcgagc 
4621 tcgcgcrgct ggacggggcc cgcgggggcc 
4681 gctaccrgcc caacacgctg accgacgcac 
4741 tgcgccgcgt gggcgacgac grgczggtrc 
4801 tggnggctcc cagctgcgcc taccaggrgt 
4861 ccactcaggc ccggcccccg ccacacgcta 
4921 gggcctggaa ccatagcgrc agggaggccg 
4981 cgaggaggcg cgggggcagt gccagccgaa 
5041 gcgcrgcccc tgagccggag cggacgcccg 
5101 ggacgcgtgg accgagtgac cgtgg"tct 
5161 aagccacctc tttggaggg- gcgc-czcrg 
5221 gccagcacca cgcgggcccc cca^ccacat 
5281 gtcccccggr gracgccgag accaagcact 
5341 tgcggccctc cttcctac-c agctc-ctga 
5401 tggagaccat: ctttctgggt cccaggcccn 
5461 gccrgcccca gcgcractgg caaacgcggc 
5521 cgcagtgccc ctacggggtg crcc-caaga 
5581 cagcagccgg tgtctgtgcc cgggagaagc 
5641 aggacacaga cccccgtcgc crggrgcagc 
5701 tgtacggctt cgtgcgggcc tgccrgcgcc 
5761 ggcacaacga acgccgcttc ctcaggaaca 
5821 ccaagctctc gctgcaggag crgacgrgga 
5881 gcaggagccc aggggttggc tgtgrzccgg 
5941 tggccaagtt cctgcactgg ctgatgagtg 
6001 tttatgtcac ggagaccacg ttrcaaaaga 
6061 ggagcaagtr gcaaagcact ggaaccagac 
6121 tgtcggaagc agaggccagg cagcatcggg 
6131 tccgctrcat ccccaagcct gacgggcrgc 
6241 gagccagaac gttccgcaga gaaaagaggg 
6301 tgttcagcgt gctcaactac gagcgggcgc 
6361 tgggcctgga cgatatccac agggcczggc 
6421 acccgccgcc tgagctgtac trtgncaagg 
6481 tcaaacccag aacacgtact gcgtgcgrcg 
6541 gcacgtccgc aaggccttca agagccacgt 
6601 gcgacagttc gtggctcacc ' tgcaggagac 
6661 gcagagctcc tccctgaatg aggccagcag 
6721 gtgccaccac gccgtgcgca tcaggggcaa 



gagcgtcaga ccccgtagaa aagatcaaag 
taatctgctg cttgcaaaca aaaaaaccac 
aagagctacc aactct.tttt ccgaaggtaa 
ctgtccttct agtgtagccg tagttaggcc 
catacctcgc tctgctaatc ctgttaccag 
ttaccgggtt ggactcaaga cgatagttac 
ggggttcgtg cacacagccc agcttggagc 
agcgtgagca ttgagaaagc gccacgcttc 
taagcggcag ggtcggaaca ggagagcgca 
atctttatag tcctgtcggg tttcgccacc 
cgtcaggggg gcggagccta tggaaaaacg 
ccttttgctg gccttttgct cacatgttct 
accgtattac cgcctttgag tgagctgata 
gcgagtcagt gagcgaggaa gcggaagagc 
gttggccgat tcattaatgc agaattaatt 
cggtgcacca atgcttctgg cgtcaggcag 
tcgtaaatca ctgcataatt cgtgtcgctc 
ttgcgccgac atcataacgg ttctggcaaa 
atcggctcgt ataatgtgtg gaattgtgag 
tgaattcaga tctcaccatg aaggagcrgg 
gcggcgcgaa gaacgtgctg gccttcggcr 
cccccgaggc cttcaccacc agcgtgcgca 
tgcgggggag cggggcgtgg gggctgcrgc 
acctgc-ggc acgctgcgcg ctctttgrgc 
gcgggccgcc gctgtaccag ctcggcgcrg 
gtggaccccg aaggcgtctg ggacgcgaac 
gggtcccccc gggcctgcca gccccgggrg 
gtctgccgtt gcccaagagg cccaggcgtg 
ttgggcaggg gtcctgggcc cacccgggca 
gtgtggtgtc acctgccaga cccgccgaag 
gcacgcgcca ctcccaccca tccgtgggcc 
cgcggccacc acgtccctgg gacacgcctt 
tcctctactc ctcaggcgac aaggagcagc 
ggcccagcct gactggcgct cggaggctcg 
ggatgccagg gactccccgc aggttgcccc 
ccctgtttct ggagctgctt gggaaccacg 
cgcactgccc gctgcgagct gcggtcaccc 
cccagggctc tgrggcggcc cccgaggagg 
tgcrccgcca gcacagcagc ccctggcagg 
ggcrggtgcc cccaggcctc tggggctcca 
ccaagaagtt catctccctg gggaagcatg 
agatgagcgt gcgggactgc gcttggctgc 
ccgcagagca ccgtctgcgt gaggagatcc 
tgtacgtcgt cgagctgctc aggtc-ttcr 
acaggctctt tttctaccgg aagagrgtcr 
agcacrtgaa gagggtgcag ctgcgggagc 
aagccaggcc cgccctgctg acgtccagac 
ggccgattgt gaacatggac tacgtcgtgg 
ccgagcgrct cacctcgagg gtgaaggcac 
ggcgccccgg cctcctgggc gcctctgtgc 
gcaccttcgt gctgcgtgtg cgggcccagg 
acaggctcac ggaggtcatc gccagcatca 
gtatgccgtg gtccagaagg ccgcccatgg 
ctctaccttg acagacctcc agccgtacat 
cagcccgctg agggatgccg tcgtcatcga 
tggcctcttc gacgtcttcc tacgcttcat 
gtcctacgtc cagtgccagg ggatcccgca 
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6781 gggctccatc ctctccacgc tgctctgcag 
6841 gtttgcgggg attcggcggg acgggctgct 
6901 gacacctcac ctcacccacg cgaaaacctt 
6961 gtatggctgc gtggtgaact tgcggaagac 
7021 cctgggtggc acggcttttg ttcagatgcc 
7081 gctgctggat acccggaccc tggaggtgca 
7141 catcagagcc agtctcacct tcaaccgcgg 
7201 actctttggg gtcttgcggc tgaagtgtca 
7261 cctccagacg gtgtgcacca acatctacaa 
7321 cgcatgtgtg ctgcagctcc catttcatca 
7381 gcgcgtcatc tctgacacgg cctccctctg 
7441 gatgtcgctg ggggccaagg gcgccgccgg 
7501 gtgccaccaa gcattzcctgc tcaagctgac 
7561 ggggtcactc aggacagccc agacgcagct 
7621 tgccctggag gccgcagcca acccggcact 
7681 atctagag 



cctgtgctac ggcgacatgg agaacaagct 
cctgcgtttg gtggatgatt tcttgttggt 
cctcaggacc ctggtccgag gtgtccctga 
agtggtgaac ttccctgtag aagacgaggc 
ggcccacggc ctattcccct ggtgcggcct 
gagcgactac tccagctatg cccggacctc 
cttcaaggct gggaggaaca tgcgtcgcaa 
cagcctgttt ctggatttgc aggtgaacag 
gatcctcctg ctgcaggcgt acaggtttca 
gcaagtttgg aagaacccca catttttcct 
ctactccatc ctgaaagcca agaacgcagg 
ccctctgccc tccgaggccg tgcagtggct 
tcgacaccgt gtcacctacg tgccactcct 
gagtcggaag ctcccgggga cgacgctgac 
gccctcagac ttcaagacca tcctggactg 
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